1 /*
2  * Copyright 2010 Red Hat Inc.
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice shall be included in
12  * all copies or substantial portions of the Software.
13  *
14  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20  * OTHER DEALINGS IN THE SOFTWARE.
21  *
22  * Authors: Ben Skeggs
23  */
24 #ifndef __GF100_GR_H__
25 #define __GF100_GR_H__
26 #define gf100_gr(p) container_of((p), struct gf100_gr, base)
27 #include "priv.h"
28 
29 #include <core/gpuobj.h>
30 #include <subdev/ltc.h>
31 #include <subdev/mmu.h>
32 #include <engine/falcon.h>
33 
34 #define GPC_MAX 32
35 #define TPC_MAX_PER_GPC 8
36 #define TPC_MAX (GPC_MAX * TPC_MAX_PER_GPC)
37 
38 #define ROP_BCAST(r)      (0x408800 + (r))
39 #define ROP_UNIT(u, r)    (0x410000 + (u) * 0x400 + (r))
40 #define GPC_BCAST(r)      (0x418000 + (r))
41 #define GPC_UNIT(t, r)    (0x500000 + (t) * 0x8000 + (r))
42 #define PPC_UNIT(t, m, r) (0x503000 + (t) * 0x8000 + (m) * 0x200 + (r))
43 #define TPC_UNIT(t, m, r) (0x504000 + (t) * 0x8000 + (m) * 0x800 + (r))
44 
45 struct gf100_gr_data {
46 	u32 size;
47 	u32 align;
48 	bool priv;
49 };
50 
51 struct gf100_gr_mmio {
52 	u32 addr;
53 	u32 data;
54 	u32 shift;
55 	int buffer;
56 };
57 
58 struct gf100_gr_fuc {
59 	u32 *data;
60 	u32  size;
61 };
62 
63 struct gf100_gr_zbc_color {
64 	u32 format;
65 	u32 ds[4];
66 	u32 l2[4];
67 };
68 
69 struct gf100_gr_zbc_depth {
70 	u32 format;
71 	u32 ds;
72 	u32 l2;
73 };
74 
75 struct gf100_gr_zbc_stencil {
76 	u32 format;
77 	u32 ds;
78 	u32 l2;
79 };
80 
81 struct gf100_gr {
82 	const struct gf100_gr_func *func;
83 	struct nvkm_gr base;
84 
85 	struct {
86 		struct nvkm_falcon *falcon;
87 		struct mutex mutex;
88 		u32 disable;
89 	} fecs;
90 
91 	struct {
92 		struct nvkm_falcon *falcon;
93 	} gpccs;
94 
95 	struct gf100_gr_fuc fuc409c;
96 	struct gf100_gr_fuc fuc409d;
97 	struct gf100_gr_fuc fuc41ac;
98 	struct gf100_gr_fuc fuc41ad;
99 	bool firmware;
100 
101 	/*
102 	 * Used if the register packs are loaded from NVIDIA fw instead of
103 	 * using hardcoded arrays. To be allocated with vzalloc().
104 	 */
105 	struct gf100_gr_pack *fuc_sw_nonctx;
106 	struct gf100_gr_pack *fuc_sw_ctx;
107 	struct gf100_gr_pack *fuc_bundle;
108 	struct gf100_gr_pack *fuc_method;
109 
110 	struct gf100_gr_zbc_color zbc_color[NVKM_LTC_MAX_ZBC_CNT];
111 	struct gf100_gr_zbc_depth zbc_depth[NVKM_LTC_MAX_ZBC_CNT];
112 	struct gf100_gr_zbc_stencil zbc_stencil[NVKM_LTC_MAX_ZBC_CNT];
113 
114 	u8 rop_nr;
115 	u8 gpc_nr;
116 	u8 tpc_nr[GPC_MAX];
117 	u8 tpc_max;
118 	u8 tpc_total;
119 	u8 ppc_nr[GPC_MAX];
120 	u8 ppc_mask[GPC_MAX];
121 	u8 ppc_tpc_mask[GPC_MAX][4];
122 	u8 ppc_tpc_nr[GPC_MAX][4];
123 	u8 ppc_tpc_min;
124 	u8 ppc_tpc_max;
125 
126 	u8 screen_tile_row_offset;
127 	u8 tile[TPC_MAX];
128 
129 	struct {
130 		u8 gpc;
131 		u8 tpc;
132 	} sm[TPC_MAX];
133 	u8 sm_nr;
134 
135 	struct gf100_gr_data mmio_data[4];
136 	struct gf100_gr_mmio mmio_list[4096/8];
137 	u32  size;
138 	u32 *data;
139 	u32 size_zcull;
140 	u32 size_pm;
141 };
142 
143 int gf100_gr_ctor(const struct gf100_gr_func *, struct nvkm_device *,
144 		  int, struct gf100_gr *);
145 int gf100_gr_new_(const struct gf100_gr_func *, struct nvkm_device *,
146 		  int, struct nvkm_gr **);
147 void *gf100_gr_dtor(struct nvkm_gr *);
148 
149 int gf100_gr_fecs_bind_pointer(struct gf100_gr *, u32 inst);
150 
151 struct gf100_gr_func_zbc {
152 	void (*clear_color)(struct gf100_gr *, int zbc);
153 	void (*clear_depth)(struct gf100_gr *, int zbc);
154 	int (*stencil_get)(struct gf100_gr *, int format,
155 			   const u32 ds, const u32 l2);
156 	void (*clear_stencil)(struct gf100_gr *, int zbc);
157 };
158 
159 struct gf100_gr_func {
160 	void (*dtor)(struct gf100_gr *);
161 	void (*oneinit_tiles)(struct gf100_gr *);
162 	void (*oneinit_sm_id)(struct gf100_gr *);
163 	int (*init)(struct gf100_gr *);
164 	void (*init_419bd8)(struct gf100_gr *);
165 	void (*init_gpc_mmu)(struct gf100_gr *);
166 	void (*init_r405a14)(struct gf100_gr *);
167 	void (*init_bios)(struct gf100_gr *);
168 	void (*init_vsc_stream_master)(struct gf100_gr *);
169 	void (*init_zcull)(struct gf100_gr *);
170 	void (*init_num_active_ltcs)(struct gf100_gr *);
171 	void (*init_rop_active_fbps)(struct gf100_gr *);
172 	void (*init_bios_2)(struct gf100_gr *);
173 	void (*init_swdx_pes_mask)(struct gf100_gr *);
174 	void (*init_fecs_exceptions)(struct gf100_gr *);
175 	void (*init_ds_hww_esr_2)(struct gf100_gr *);
176 	void (*init_40601c)(struct gf100_gr *);
177 	void (*init_sked_hww_esr)(struct gf100_gr *);
178 	void (*init_419cc0)(struct gf100_gr *);
179 	void (*init_419eb4)(struct gf100_gr *);
180 	void (*init_419c9c)(struct gf100_gr *);
181 	void (*init_ppc_exceptions)(struct gf100_gr *);
182 	void (*init_tex_hww_esr)(struct gf100_gr *, int gpc, int tpc);
183 	void (*init_504430)(struct gf100_gr *, int gpc, int tpc);
184 	void (*init_shader_exceptions)(struct gf100_gr *, int gpc, int tpc);
185 	void (*init_400054)(struct gf100_gr *);
186 	void (*init_4188a4)(struct gf100_gr *);
187 	void (*trap_mp)(struct gf100_gr *, int gpc, int tpc);
188 	void (*set_hww_esr_report_mask)(struct gf100_gr *);
189 	const struct gf100_gr_pack *mmio;
190 	struct {
191 		struct gf100_gr_ucode *ucode;
192 	} fecs;
193 	struct {
194 		struct gf100_gr_ucode *ucode;
195 	} gpccs;
196 	int (*rops)(struct gf100_gr *);
197 	int gpc_nr;
198 	int tpc_nr;
199 	int ppc_nr;
200 	const struct gf100_grctx_func *grctx;
201 	const struct nvkm_therm_clkgate_pack *clkgate_pack;
202 	const struct gf100_gr_func_zbc *zbc;
203 	struct nvkm_sclass sclass[];
204 };
205 
206 int gf100_gr_rops(struct gf100_gr *);
207 void gf100_gr_oneinit_tiles(struct gf100_gr *);
208 void gf100_gr_oneinit_sm_id(struct gf100_gr *);
209 int gf100_gr_init(struct gf100_gr *);
210 void gf100_gr_init_vsc_stream_master(struct gf100_gr *);
211 void gf100_gr_init_zcull(struct gf100_gr *);
212 void gf100_gr_init_num_active_ltcs(struct gf100_gr *);
213 void gf100_gr_init_fecs_exceptions(struct gf100_gr *);
214 void gf100_gr_init_40601c(struct gf100_gr *);
215 void gf100_gr_init_419cc0(struct gf100_gr *);
216 void gf100_gr_init_419eb4(struct gf100_gr *);
217 void gf100_gr_init_tex_hww_esr(struct gf100_gr *, int, int);
218 void gf100_gr_init_shader_exceptions(struct gf100_gr *, int, int);
219 void gf100_gr_init_400054(struct gf100_gr *);
220 extern const struct gf100_gr_func_zbc gf100_gr_zbc;
221 
222 void gf117_gr_init_zcull(struct gf100_gr *);
223 
224 void gk104_gr_init_vsc_stream_master(struct gf100_gr *);
225 void gk104_gr_init_rop_active_fbps(struct gf100_gr *);
226 void gk104_gr_init_ppc_exceptions(struct gf100_gr *);
227 void gk104_gr_init_sked_hww_esr(struct gf100_gr *);
228 
229 void gk110_gr_init_419eb4(struct gf100_gr *);
230 
231 void gm107_gr_init_504430(struct gf100_gr *, int, int);
232 void gm107_gr_init_shader_exceptions(struct gf100_gr *, int, int);
233 void gm107_gr_init_400054(struct gf100_gr *);
234 
235 int gk20a_gr_init(struct gf100_gr *);
236 
237 void gm200_gr_oneinit_tiles(struct gf100_gr *);
238 void gm200_gr_oneinit_sm_id(struct gf100_gr *);
239 int gm200_gr_rops(struct gf100_gr *);
240 void gm200_gr_init_num_active_ltcs(struct gf100_gr *);
241 void gm200_gr_init_ds_hww_esr_2(struct gf100_gr *);
242 
243 void gp100_gr_init_rop_active_fbps(struct gf100_gr *);
244 void gp100_gr_init_fecs_exceptions(struct gf100_gr *);
245 void gp100_gr_init_shader_exceptions(struct gf100_gr *, int, int);
246 void gp100_gr_zbc_clear_color(struct gf100_gr *, int);
247 void gp100_gr_zbc_clear_depth(struct gf100_gr *, int);
248 
249 void gp102_gr_init_swdx_pes_mask(struct gf100_gr *);
250 extern const struct gf100_gr_func_zbc gp102_gr_zbc;
251 
252 #define gf100_gr_chan(p) container_of((p), struct gf100_gr_chan, object)
253 #include <core/object.h>
254 
255 struct gf100_gr_chan {
256 	struct nvkm_object object;
257 	struct gf100_gr *gr;
258 	struct nvkm_vmm *vmm;
259 
260 	struct nvkm_memory *mmio;
261 	struct nvkm_vma *mmio_vma;
262 	int mmio_nr;
263 
264 	struct {
265 		struct nvkm_memory *mem;
266 		struct nvkm_vma *vma;
267 	} data[4];
268 };
269 
270 void gf100_gr_ctxctl_debug(struct gf100_gr *);
271 
272 void gf100_gr_dtor_fw(struct gf100_gr_fuc *);
273 int  gf100_gr_ctor_fw(struct gf100_gr *, const char *,
274 		      struct gf100_gr_fuc *);
275 u64  gf100_gr_units(struct nvkm_gr *);
276 void gf100_gr_zbc_init(struct gf100_gr *);
277 
278 extern const struct nvkm_object_func gf100_fermi;
279 
280 struct gf100_gr_init {
281 	u32 addr;
282 	u8  count;
283 	u32 pitch;
284 	u32 data;
285 };
286 
287 struct gf100_gr_pack {
288 	const struct gf100_gr_init *init;
289 	u32 type;
290 };
291 
292 #define pack_for_each_init(init, pack, head)                                   \
293 	for (pack = head; pack && pack->init; pack++)                          \
294 		  for (init = pack->init; init && init->count; init++)
295 
296 struct gf100_gr_ucode {
297 	struct gf100_gr_fuc code;
298 	struct gf100_gr_fuc data;
299 };
300 
301 extern struct gf100_gr_ucode gf100_gr_fecs_ucode;
302 extern struct gf100_gr_ucode gf100_gr_gpccs_ucode;
303 
304 extern struct gf100_gr_ucode gk110_gr_fecs_ucode;
305 extern struct gf100_gr_ucode gk110_gr_gpccs_ucode;
306 
307 int  gf100_gr_wait_idle(struct gf100_gr *);
308 void gf100_gr_mmio(struct gf100_gr *, const struct gf100_gr_pack *);
309 void gf100_gr_icmd(struct gf100_gr *, const struct gf100_gr_pack *);
310 void gf100_gr_mthd(struct gf100_gr *, const struct gf100_gr_pack *);
311 int  gf100_gr_init_ctxctl(struct gf100_gr *);
312 
313 /* external bundles loading functions */
314 int gk20a_gr_av_to_init(struct gf100_gr *, const char *,
315 			struct gf100_gr_pack **);
316 int gk20a_gr_aiv_to_init(struct gf100_gr *, const char *,
317 			 struct gf100_gr_pack **);
318 int gk20a_gr_av_to_method(struct gf100_gr *, const char *,
319 			  struct gf100_gr_pack **);
320 
321 int gm200_gr_new_(const struct gf100_gr_func *, struct nvkm_device *, int,
322 		  struct nvkm_gr **);
323 
324 /* register init value lists */
325 
326 extern const struct gf100_gr_init gf100_gr_init_main_0[];
327 extern const struct gf100_gr_init gf100_gr_init_fe_0[];
328 extern const struct gf100_gr_init gf100_gr_init_pri_0[];
329 extern const struct gf100_gr_init gf100_gr_init_rstr2d_0[];
330 extern const struct gf100_gr_init gf100_gr_init_pd_0[];
331 extern const struct gf100_gr_init gf100_gr_init_ds_0[];
332 extern const struct gf100_gr_init gf100_gr_init_scc_0[];
333 extern const struct gf100_gr_init gf100_gr_init_prop_0[];
334 extern const struct gf100_gr_init gf100_gr_init_gpc_unk_0[];
335 extern const struct gf100_gr_init gf100_gr_init_setup_0[];
336 extern const struct gf100_gr_init gf100_gr_init_crstr_0[];
337 extern const struct gf100_gr_init gf100_gr_init_setup_1[];
338 extern const struct gf100_gr_init gf100_gr_init_zcull_0[];
339 extern const struct gf100_gr_init gf100_gr_init_gpm_0[];
340 extern const struct gf100_gr_init gf100_gr_init_gpc_unk_1[];
341 extern const struct gf100_gr_init gf100_gr_init_gcc_0[];
342 extern const struct gf100_gr_init gf100_gr_init_tpccs_0[];
343 extern const struct gf100_gr_init gf100_gr_init_tex_0[];
344 extern const struct gf100_gr_init gf100_gr_init_pe_0[];
345 extern const struct gf100_gr_init gf100_gr_init_l1c_0[];
346 extern const struct gf100_gr_init gf100_gr_init_wwdx_0[];
347 extern const struct gf100_gr_init gf100_gr_init_tpccs_1[];
348 extern const struct gf100_gr_init gf100_gr_init_mpc_0[];
349 extern const struct gf100_gr_init gf100_gr_init_be_0[];
350 extern const struct gf100_gr_init gf100_gr_init_fe_1[];
351 extern const struct gf100_gr_init gf100_gr_init_pe_1[];
352 void gf100_gr_init_gpc_mmu(struct gf100_gr *);
353 void gf100_gr_trap_mp(struct gf100_gr *, int, int);
354 extern const struct nvkm_bitfield gf100_mp_global_error[];
355 extern const struct nvkm_enum gf100_mp_warp_error[];
356 
357 extern const struct gf100_gr_init gf104_gr_init_ds_0[];
358 extern const struct gf100_gr_init gf104_gr_init_tex_0[];
359 extern const struct gf100_gr_init gf104_gr_init_sm_0[];
360 
361 extern const struct gf100_gr_init gf108_gr_init_gpc_unk_0[];
362 extern const struct gf100_gr_init gf108_gr_init_setup_1[];
363 
364 extern const struct gf100_gr_init gf119_gr_init_pd_0[];
365 extern const struct gf100_gr_init gf119_gr_init_ds_0[];
366 extern const struct gf100_gr_init gf119_gr_init_prop_0[];
367 extern const struct gf100_gr_init gf119_gr_init_gpm_0[];
368 extern const struct gf100_gr_init gf119_gr_init_gpc_unk_1[];
369 extern const struct gf100_gr_init gf119_gr_init_tex_0[];
370 extern const struct gf100_gr_init gf119_gr_init_sm_0[];
371 extern const struct gf100_gr_init gf119_gr_init_fe_1[];
372 
373 extern const struct gf100_gr_init gf117_gr_init_pes_0[];
374 extern const struct gf100_gr_init gf117_gr_init_wwdx_0[];
375 extern const struct gf100_gr_init gf117_gr_init_cbm_0[];
376 
377 extern const struct gf100_gr_init gk104_gr_init_main_0[];
378 extern const struct gf100_gr_init gk104_gr_init_gpc_unk_2[];
379 extern const struct gf100_gr_init gk104_gr_init_tpccs_0[];
380 extern const struct gf100_gr_init gk104_gr_init_pe_0[];
381 extern const struct gf100_gr_init gk104_gr_init_be_0[];
382 extern const struct gf100_gr_pack gk104_gr_pack_mmio[];
383 
384 extern const struct gf100_gr_init gk110_gr_init_fe_0[];
385 extern const struct gf100_gr_init gk110_gr_init_ds_0[];
386 extern const struct gf100_gr_init gk110_gr_init_sked_0[];
387 extern const struct gf100_gr_init gk110_gr_init_cwd_0[];
388 extern const struct gf100_gr_init gk110_gr_init_gpc_unk_1[];
389 extern const struct gf100_gr_init gk110_gr_init_tex_0[];
390 extern const struct gf100_gr_init gk110_gr_init_sm_0[];
391 
392 extern const struct gf100_gr_init gk208_gr_init_gpc_unk_0[];
393 
394 extern const struct gf100_gr_init gm107_gr_init_scc_0[];
395 extern const struct gf100_gr_init gm107_gr_init_prop_0[];
396 extern const struct gf100_gr_init gm107_gr_init_setup_1[];
397 extern const struct gf100_gr_init gm107_gr_init_zcull_0[];
398 extern const struct gf100_gr_init gm107_gr_init_gpc_unk_1[];
399 extern const struct gf100_gr_init gm107_gr_init_tex_0[];
400 extern const struct gf100_gr_init gm107_gr_init_l1c_0[];
401 extern const struct gf100_gr_init gm107_gr_init_wwdx_0[];
402 extern const struct gf100_gr_init gm107_gr_init_cbm_0[];
403 void gm107_gr_init_bios(struct gf100_gr *);
404 
405 void gm200_gr_init_gpc_mmu(struct gf100_gr *);
406 #endif
407