/*
 * Copyright 2015 Red Hat Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 * Authors: Ben Skeggs <bskeggs@redhat.com>
 */
#include "gf100.h"
#include "ctxgf100.h"

#include <subdev/secboot.h>

#include <nvif/class.h>

/*******************************************************************************
 * PGRAPH engine/subdev functions
 ******************************************************************************/

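/* Number of ROPs, read from the same PTOP register that
 * gm200_gr_init_rop_active_fbps() below treats as the FBP count.
 */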
int
gm200_gr_rops(struct gf100_gr *gr)
{
	return nvkm_rd32(gr->base.engine.subdev.device, 0x12006c);
}

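/* Mirror the PFB MMU configuration into the GPC MMUs. */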
void
gm200_gr_init_gpc_mmu(struct gf100_gr *gr)
{
	struct nvkm_device *device = gr->base.engine.subdev.device;

	nvkm_wr32(device, 0x418880, nvkm_rd32(device, 0x100c80) & 0xf0001fff);
	nvkm_wr32(device, 0x418890, 0x00000000);
	nvkm_wr32(device, 0x418894, 0x00000000);

	nvkm_wr32(device, 0x4188b4, nvkm_rd32(device, 0x100cc8));
	nvkm_wr32(device, 0x4188b8, nvkm_rd32(device, 0x100ccc));
	nvkm_wr32(device, 0x4188b0, nvkm_rd32(device, 0x100cc4));
}

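/* Program the active FBP count into the ZROP and CROP units. */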
static void
gm200_gr_init_rop_active_fbps(struct gf100_gr *gr)
{
	struct nvkm_device *device = gr->base.engine.subdev.device;
	const u32 fbp_count = nvkm_rd32(device, 0x12006c);
	nvkm_mask(device, 0x408850, 0x0000000f, fbp_count); /* zrop */
	nvkm_mask(device, 0x408958, 0x0000000f, fbp_count); /* crop */
}

int
gm200_gr_init(struct gf100_gr *gr)
{
	struct nvkm_device *device = gr->base.engine.subdev.device;
	const u32 magicgpc918 = DIV_ROUND_UP(0x00800000, gr->tpc_total);
	u32 data[TPC_MAX / 8] = {};
	u8  tpcnr[GPC_MAX];
	int gpc, tpc, rop;
	int i;

	gr->func->init_gpc_mmu(gr);

	gf100_gr_mmio(gr, gr->fuc_sw_nonctx);

	gm107_gr_init_bios(gr);

	nvkm_wr32(device, GPC_UNIT(0, 0x3018), 0x00000001);

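	/* Distribute TPCs across GPCs round-robin and broadcast the
	 * resulting table (one 4-bit entry per TPC) to all GPCs.
	 */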
	memset(data, 0x00, sizeof(data));
	memcpy(tpcnr, gr->tpc_nr, sizeof(gr->tpc_nr));
	for (i = 0, gpc = -1; i < gr->tpc_total; i++) {
		do {
			gpc = (gpc + 1) % gr->gpc_nr;
		} while (!tpcnr[gpc]);
		tpc = gr->tpc_nr[gpc] - tpcnr[gpc]--;

		data[i / 8] |= tpc << ((i % 8) * 4);
	}

	nvkm_wr32(device, GPC_BCAST(0x0980), data[0]);
	nvkm_wr32(device, GPC_BCAST(0x0984), data[1]);
	nvkm_wr32(device, GPC_BCAST(0x0988), data[2]);
	nvkm_wr32(device, GPC_BCAST(0x098c), data[3]);

	for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0914),
			  gr->screen_tile_row_offset << 8 | gr->tpc_nr[gpc]);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0910), 0x00040000 |
							 gr->tpc_total);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0918), magicgpc918);
	}

	nvkm_wr32(device, GPC_BCAST(0x3fd4), magicgpc918);
	nvkm_wr32(device, GPC_BCAST(0x08ac), nvkm_rd32(device, 0x100800));
	nvkm_wr32(device, GPC_BCAST(0x033c), nvkm_rd32(device, 0x100804));

	gr->func->init_rop_active_fbps(gr);

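	/* Interrupt reset/enable and exception setup for the global PGRAPH units. */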
	nvkm_wr32(device, 0x400500, 0x00010001);
	nvkm_wr32(device, 0x400100, 0xffffffff);
	nvkm_wr32(device, 0x40013c, 0xffffffff);
	nvkm_wr32(device, 0x400124, 0x00000002);
	nvkm_wr32(device, 0x409c24, 0x000e0000);
	nvkm_wr32(device, 0x405848, 0xc0000000);
	nvkm_wr32(device, 0x40584c, 0x00000001);
	nvkm_wr32(device, 0x404000, 0xc0000000);
	nvkm_wr32(device, 0x404600, 0xc0000000);
	nvkm_wr32(device, 0x408030, 0xc0000000);
	nvkm_wr32(device, 0x404490, 0xc0000000);
	nvkm_wr32(device, 0x406018, 0xc0000000);
	nvkm_wr32(device, 0x407020, 0x40000000);
	nvkm_wr32(device, 0x405840, 0xc0000000);
	nvkm_wr32(device, 0x405844, 0x00ffffff);
	nvkm_mask(device, 0x419cc0, 0x00000008, 0x00000008);

	gr->func->init_ppc_exceptions(gr);

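	/* Enable exception reporting for each GPC and its TPCs. */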
	for (gpc = 0; gpc < gr->gpc_nr; gpc++) {
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0420), 0xc0000000);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0900), 0xc0000000);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x1028), 0xc0000000);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x0824), 0xc0000000);
		for (tpc = 0; tpc < gr->tpc_nr[gpc]; tpc++) {
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x508), 0xffffffff);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x50c), 0xffffffff);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x224), 0xc0000000);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x48c), 0xc0000000);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x084), 0xc0000000);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x430), 0xc0000000);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x644), 0x00dffffe);
			nvkm_wr32(device, TPC_UNIT(gpc, tpc, 0x64c), 0x00000005);
		}
		nvkm_wr32(device, GPC_UNIT(gpc, 0x2c90), 0xffffffff);
		nvkm_wr32(device, GPC_UNIT(gpc, 0x2c94), 0xffffffff);
	}

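	/* Enable exception reporting for each ROP. */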
	for (rop = 0; rop < gr->rop_nr; rop++) {
		nvkm_wr32(device, ROP_UNIT(rop, 0x144), 0x40000000);
		nvkm_wr32(device, ROP_UNIT(rop, 0x070), 0x40000000);
		nvkm_wr32(device, ROP_UNIT(rop, 0x204), 0xffffffff);
		nvkm_wr32(device, ROP_UNIT(rop, 0x208), 0xffffffff);
	}

	nvkm_wr32(device, 0x400108, 0xffffffff);
	nvkm_wr32(device, 0x400138, 0xffffffff);
	nvkm_wr32(device, 0x400118, 0xffffffff);
	nvkm_wr32(device, 0x400130, 0xffffffff);
	nvkm_wr32(device, 0x40011c, 0xffffffff);
	nvkm_wr32(device, 0x400134, 0xffffffff);

	nvkm_wr32(device, 0x400054, 0x2c350f63);

	gf100_gr_zbc_init(gr);

	return gf100_gr_init_ctxctl(gr);
}

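/* Allocate the GR instance and load the required firmware images,
 * skipping the FECS/GPCCS falcons when they're managed by secure boot.
 */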
int
gm200_gr_new_(const struct gf100_gr_func *func, struct nvkm_device *device,
	      int index, struct nvkm_gr **pgr)
{
	struct gf100_gr *gr;
	int ret;

	if (!(gr = kzalloc(sizeof(*gr), GFP_KERNEL)))
		return -ENOMEM;
	*pgr = &gr->base;

	ret = gf100_gr_ctor(func, device, index, gr);
	if (ret)
		return ret;

	/* Load firmware for the falcons not managed by secure boot. */
	if (!nvkm_secboot_is_managed(device->secboot,
				     NVKM_SECBOOT_FALCON_FECS)) {
		if ((ret = gf100_gr_ctor_fw(gr, "gr/fecs_inst", &gr->fuc409c)) ||
		    (ret = gf100_gr_ctor_fw(gr, "gr/fecs_data", &gr->fuc409d)))
			return ret;
	}
	if (!nvkm_secboot_is_managed(device->secboot,
				     NVKM_SECBOOT_FALCON_GPCCS)) {
		if ((ret = gf100_gr_ctor_fw(gr, "gr/gpccs_inst", &gr->fuc41ac)) ||
		    (ret = gf100_gr_ctor_fw(gr, "gr/gpccs_data", &gr->fuc41ad)))
			return ret;
	}

	if ((ret = gk20a_gr_av_to_init(gr, "gr/sw_nonctx", &gr->fuc_sw_nonctx)) ||
	    (ret = gk20a_gr_aiv_to_init(gr, "gr/sw_ctx", &gr->fuc_sw_ctx)) ||
	    (ret = gk20a_gr_av_to_init(gr, "gr/sw_bundle_init", &gr->fuc_bundle)) ||
	    (ret = gk20a_gr_av_to_method(gr, "gr/sw_method_init", &gr->fuc_method)))
		return ret;

	return 0;
}

static const struct gf100_gr_func
gm200_gr = {
	.init = gm200_gr_init,
	.init_gpc_mmu = gm200_gr_init_gpc_mmu,
	.init_rop_active_fbps = gm200_gr_init_rop_active_fbps,
	.init_ppc_exceptions = gk104_gr_init_ppc_exceptions,
	.rops = gm200_gr_rops,
	.ppc_nr = 2,
	.grctx = &gm200_grctx,
	.sclass = {
		{ -1, -1, FERMI_TWOD_A },
		{ -1, -1, KEPLER_INLINE_TO_MEMORY_B },
		{ -1, -1, MAXWELL_B, &gf100_fermi },
		{ -1, -1, MAXWELL_COMPUTE_B },
		{}
	}
};

int
gm200_gr_new(struct nvkm_device *device, int index, struct nvkm_gr **pgr)
{
	return gm200_gr_new_(&gm200_gr, device, index, pgr);
}