1 /* 2 * Copyright 2010 Red Hat Inc. 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice shall be included in 12 * all copies or substantial portions of the Software. 13 * 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR 18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 20 * OTHER DEALINGS IN THE SOFTWARE. 21 * 22 * Authors: Ben Skeggs 23 */ 24 #ifndef __GF100_GR_H__ 25 #define __GF100_GR_H__ 26 #define gf100_gr(p) container_of((p), struct gf100_gr, base) 27 #include "priv.h" 28 29 #include <core/gpuobj.h> 30 #include <subdev/ltc.h> 31 #include <subdev/mmu.h> 32 #include <engine/falcon.h> 33 34 struct nvkm_acr_lsfw; 35 36 #define GPC_MAX 32 37 #define TPC_MAX_PER_GPC 8 38 #define TPC_MAX (GPC_MAX * TPC_MAX_PER_GPC) 39 40 #define ROP_BCAST(r) (0x408800 + (r)) 41 #define ROP_UNIT(u, r) (0x410000 + (u) * 0x400 + (r)) 42 #define GPC_BCAST(r) (0x418000 + (r)) 43 #define GPC_UNIT(t, r) (0x500000 + (t) * 0x8000 + (r)) 44 #define PPC_UNIT(t, m, r) (0x503000 + (t) * 0x8000 + (m) * 0x200 + (r)) 45 #define TPC_UNIT(t, m, r) (0x504000 + (t) * 0x8000 + (m) * 0x800 + (r)) 46 47 struct gf100_gr_zbc_color { 48 u32 format; 49 u32 ds[4]; 50 u32 l2[4]; 51 }; 52 53 struct gf100_gr_zbc_depth { 54 u32 format; 55 u32 ds; 56 u32 l2; 57 }; 58 59 struct gf100_gr_zbc_stencil { 60 u32 format; 61 u32 ds; 62 u32 l2; 63 }; 64 65 struct gf100_gr { 66 const struct gf100_gr_func *func; 67 struct nvkm_gr base; 68 69 struct { 70 struct nvkm_falcon falcon; 71 struct nvkm_blob inst; 72 struct nvkm_blob data; 73 74 struct mutex mutex; 75 u32 disable; 76 } fecs; 77 78 struct { 79 struct nvkm_falcon falcon; 80 struct nvkm_blob inst; 81 struct nvkm_blob data; 82 } gpccs; 83 84 bool firmware; 85 86 /* 87 * Used if the register packs are loaded from NVIDIA fw instead of 88 * using hardcoded arrays. To be allocated with vzalloc(). 89 */ 90 struct gf100_gr_pack *sw_nonctx; 91 struct gf100_gr_pack *sw_nonctx1; 92 struct gf100_gr_pack *sw_nonctx2; 93 struct gf100_gr_pack *sw_nonctx3; 94 struct gf100_gr_pack *sw_nonctx4; 95 struct gf100_gr_pack *sw_ctx; 96 struct gf100_gr_pack *bundle; 97 struct gf100_gr_pack *bundle_veid; 98 struct gf100_gr_pack *bundle64; 99 struct gf100_gr_pack *method; 100 101 struct gf100_gr_zbc_color zbc_color[NVKM_LTC_MAX_ZBC_COLOR_CNT]; 102 struct gf100_gr_zbc_depth zbc_depth[NVKM_LTC_MAX_ZBC_DEPTH_CNT]; 103 struct gf100_gr_zbc_stencil zbc_stencil[NVKM_LTC_MAX_ZBC_DEPTH_CNT]; 104 105 u8 rop_nr; 106 u8 gpc_nr; 107 u8 tpc_nr[GPC_MAX]; 108 u8 tpc_max; 109 u8 tpc_total; 110 u8 ppc_nr[GPC_MAX]; 111 u8 ppc_mask[GPC_MAX]; 112 u8 ppc_tpc_mask[GPC_MAX][4]; 113 u8 ppc_tpc_nr[GPC_MAX][4]; 114 u8 ppc_tpc_min; 115 u8 ppc_tpc_max; 116 u8 ppc_total; 117 118 struct nvkm_memory *pagepool; 119 struct nvkm_memory *bundle_cb; 120 struct nvkm_memory *attrib_cb; 121 struct nvkm_memory *unknown; 122 123 u8 screen_tile_row_offset; 124 u8 tile[TPC_MAX]; 125 126 struct { 127 u8 gpc; 128 u8 tpc; 129 } sm[TPC_MAX]; 130 u8 sm_nr; 131 132 u32 size; 133 u32 *data; 134 u32 size_zcull; 135 u32 size_pm; 136 }; 137 138 int gf100_gr_fecs_bind_pointer(struct gf100_gr *, u32 inst); 139 int gf100_gr_fecs_wfi_golden_save(struct gf100_gr *, u32 inst); 140 141 struct gf100_gr_func_zbc { 142 void (*clear_color)(struct gf100_gr *, int zbc); 143 void (*clear_depth)(struct gf100_gr *, int zbc); 144 int (*stencil_get)(struct gf100_gr *, int format, 145 const u32 ds, const u32 l2); 146 void (*clear_stencil)(struct gf100_gr *, int zbc); 147 }; 148 149 struct gf100_gr_func { 150 int (*nonstall)(struct gf100_gr *); 151 struct nvkm_intr *(*oneinit_intr)(struct gf100_gr *, enum nvkm_intr_type *); 152 void (*oneinit_tiles)(struct gf100_gr *); 153 int (*oneinit_sm_id)(struct gf100_gr *); 154 int (*init)(struct gf100_gr *); 155 void (*init_419bd8)(struct gf100_gr *); 156 void (*init_gpc_mmu)(struct gf100_gr *); 157 void (*init_r405a14)(struct gf100_gr *); 158 void (*init_bios)(struct gf100_gr *); 159 void (*init_vsc_stream_master)(struct gf100_gr *); 160 void (*init_zcull)(struct gf100_gr *); 161 void (*init_num_active_ltcs)(struct gf100_gr *); 162 void (*init_rop_active_fbps)(struct gf100_gr *); 163 void (*init_bios_2)(struct gf100_gr *); 164 void (*init_swdx_pes_mask)(struct gf100_gr *); 165 void (*init_fs)(struct gf100_gr *); 166 void (*init_fecs_exceptions)(struct gf100_gr *); 167 void (*init_40a790)(struct gf100_gr *); 168 void (*init_ds_hww_esr_2)(struct gf100_gr *); 169 void (*init_40601c)(struct gf100_gr *); 170 void (*init_sked_hww_esr)(struct gf100_gr *); 171 void (*init_419cc0)(struct gf100_gr *); 172 void (*init_419eb4)(struct gf100_gr *); 173 void (*init_419c9c)(struct gf100_gr *); 174 void (*init_ppc_exceptions)(struct gf100_gr *); 175 void (*init_tex_hww_esr)(struct gf100_gr *, int gpc, int tpc); 176 void (*init_504430)(struct gf100_gr *, int gpc, int tpc); 177 void (*init_shader_exceptions)(struct gf100_gr *, int gpc, int tpc); 178 void (*init_rop_exceptions)(struct gf100_gr *); 179 void (*init_exception2)(struct gf100_gr *); 180 void (*init_400054)(struct gf100_gr *); 181 void (*init_4188a4)(struct gf100_gr *); 182 void (*trap_mp)(struct gf100_gr *, int gpc, int tpc); 183 void (*set_hww_esr_report_mask)(struct gf100_gr *); 184 const struct gf100_gr_pack *mmio; 185 struct { 186 struct gf100_gr_ucode *ucode; 187 void (*reset)(struct gf100_gr *); 188 } fecs; 189 struct { 190 struct gf100_gr_ucode *ucode; 191 void (*reset)(struct gf100_gr *); 192 } gpccs; 193 int (*rops)(struct gf100_gr *); 194 int gpc_nr; 195 int tpc_nr; 196 int ppc_nr; 197 const struct gf100_grctx_func *grctx; 198 const struct nvkm_therm_clkgate_pack *clkgate_pack; 199 const struct gf100_gr_func_zbc *zbc; 200 struct nvkm_sclass sclass[]; 201 }; 202 203 int gf100_gr_rops(struct gf100_gr *); 204 void gf100_gr_oneinit_tiles(struct gf100_gr *); 205 int gf100_gr_oneinit_sm_id(struct gf100_gr *); 206 int gf100_gr_init(struct gf100_gr *); 207 void gf100_gr_init_vsc_stream_master(struct gf100_gr *); 208 void gf100_gr_init_zcull(struct gf100_gr *); 209 void gf100_gr_init_num_active_ltcs(struct gf100_gr *); 210 void gf100_gr_init_fecs_exceptions(struct gf100_gr *); 211 void gf100_gr_init_40601c(struct gf100_gr *); 212 void gf100_gr_init_419cc0(struct gf100_gr *); 213 void gf100_gr_init_419eb4(struct gf100_gr *); 214 void gf100_gr_init_tex_hww_esr(struct gf100_gr *, int, int); 215 void gf100_gr_init_shader_exceptions(struct gf100_gr *, int, int); 216 void gf100_gr_init_rop_exceptions(struct gf100_gr *); 217 void gf100_gr_init_exception2(struct gf100_gr *); 218 void gf100_gr_init_400054(struct gf100_gr *); 219 void gf100_gr_init_num_tpc_per_gpc(struct gf100_gr *, bool, bool); 220 extern const struct gf100_gr_func_zbc gf100_gr_zbc; 221 void gf100_gr_fecs_reset(struct gf100_gr *); 222 223 void gf117_gr_init_zcull(struct gf100_gr *); 224 225 void gk104_gr_init_vsc_stream_master(struct gf100_gr *); 226 void gk104_gr_init_rop_active_fbps(struct gf100_gr *); 227 void gk104_gr_init_ppc_exceptions(struct gf100_gr *); 228 void gk104_gr_init_sked_hww_esr(struct gf100_gr *); 229 230 void gk110_gr_init_419eb4(struct gf100_gr *); 231 232 void gm107_gr_init_504430(struct gf100_gr *, int, int); 233 void gm107_gr_init_shader_exceptions(struct gf100_gr *, int, int); 234 void gm107_gr_init_400054(struct gf100_gr *); 235 236 int gk20a_gr_init(struct gf100_gr *); 237 int gk20a_gr_av_to_init_(struct nvkm_blob *, u8 count, u32 pitch, struct gf100_gr_pack **); 238 int gk20a_gr_av_to_init(struct nvkm_blob *, struct gf100_gr_pack **); 239 int gk20a_gr_aiv_to_init(struct nvkm_blob *, struct gf100_gr_pack **); 240 int gk20a_gr_av_to_method(struct nvkm_blob *, struct gf100_gr_pack **); 241 242 void gm200_gr_oneinit_tiles(struct gf100_gr *); 243 int gm200_gr_oneinit_sm_id(struct gf100_gr *); 244 int gm200_gr_rops(struct gf100_gr *); 245 void gm200_gr_init_num_active_ltcs(struct gf100_gr *); 246 void gm200_gr_init_ds_hww_esr_2(struct gf100_gr *); 247 248 void gp100_gr_init_rop_active_fbps(struct gf100_gr *); 249 void gp100_gr_init_fecs_exceptions(struct gf100_gr *); 250 void gp100_gr_init_shader_exceptions(struct gf100_gr *, int, int); 251 void gp100_gr_zbc_clear_color(struct gf100_gr *, int); 252 void gp100_gr_zbc_clear_depth(struct gf100_gr *, int); 253 extern const struct gf100_gr_func_zbc gp100_gr_zbc; 254 255 void gp102_gr_init_swdx_pes_mask(struct gf100_gr *); 256 extern const struct gf100_gr_func_zbc gp102_gr_zbc; 257 int gp102_gr_zbc_stencil_get(struct gf100_gr *, int, const u32, const u32); 258 void gp102_gr_zbc_clear_stencil(struct gf100_gr *, int); 259 260 extern const struct gf100_gr_func gp107_gr; 261 262 int gv100_gr_oneinit_sm_id(struct gf100_gr *); 263 u32 gv100_gr_nonpes_aware_tpc(struct gf100_gr *gr, u32 gpc, u32 tpc); 264 void gv100_gr_init_419bd8(struct gf100_gr *); 265 void gv100_gr_init_504430(struct gf100_gr *, int, int); 266 void gv100_gr_init_shader_exceptions(struct gf100_gr *, int, int); 267 void gv100_gr_init_4188a4(struct gf100_gr *); 268 void gv100_gr_trap_mp(struct gf100_gr *, int, int); 269 270 int tu102_gr_av_to_init_veid(struct nvkm_blob *, struct gf100_gr_pack **); 271 void tu102_gr_init_zcull(struct gf100_gr *); 272 void tu102_gr_init_fs(struct gf100_gr *); 273 void tu102_gr_init_fecs_exceptions(struct gf100_gr *); 274 275 #define gf100_gr_chan(p) container_of((p), struct gf100_gr_chan, object) 276 #include <core/object.h> 277 278 struct gf100_gr_chan { 279 struct nvkm_object object; 280 struct gf100_gr *gr; 281 struct nvkm_vmm *vmm; 282 283 struct nvkm_vma *pagepool; 284 struct nvkm_vma *bundle_cb; 285 struct nvkm_vma *attrib_cb; 286 struct nvkm_vma *unknown; 287 288 struct nvkm_memory *mmio; 289 struct nvkm_vma *mmio_vma; 290 int mmio_nr; 291 }; 292 293 void gf100_gr_ctxctl_debug(struct gf100_gr *); 294 295 u64 gf100_gr_units(struct nvkm_gr *); 296 void gf100_gr_zbc_init(struct gf100_gr *); 297 298 extern const struct nvkm_object_func gf100_fermi; 299 300 struct gf100_gr_init { 301 u32 addr; 302 u8 count; 303 u32 pitch; 304 u64 data; 305 }; 306 307 struct gf100_gr_pack { 308 const struct gf100_gr_init *init; 309 u32 type; 310 }; 311 312 #define pack_for_each_init(init, pack, head) \ 313 for (pack = head; pack && pack->init; pack++) \ 314 for (init = pack->init; init && init->count; init++) 315 316 struct gf100_gr_ucode { 317 struct nvkm_blob code; 318 struct nvkm_blob data; 319 }; 320 321 extern struct gf100_gr_ucode gf100_gr_fecs_ucode; 322 extern struct gf100_gr_ucode gf100_gr_gpccs_ucode; 323 324 extern struct gf100_gr_ucode gk110_gr_fecs_ucode; 325 extern struct gf100_gr_ucode gk110_gr_gpccs_ucode; 326 327 int gf100_gr_wait_idle(struct gf100_gr *); 328 void gf100_gr_mmio(struct gf100_gr *, const struct gf100_gr_pack *); 329 void gf100_gr_icmd(struct gf100_gr *, const struct gf100_gr_pack *); 330 void gf100_gr_mthd(struct gf100_gr *, const struct gf100_gr_pack *); 331 int gf100_gr_init_ctxctl(struct gf100_gr *); 332 333 /* register init value lists */ 334 335 extern const struct gf100_gr_init gf100_gr_init_main_0[]; 336 extern const struct gf100_gr_init gf100_gr_init_fe_0[]; 337 extern const struct gf100_gr_init gf100_gr_init_pri_0[]; 338 extern const struct gf100_gr_init gf100_gr_init_rstr2d_0[]; 339 extern const struct gf100_gr_init gf100_gr_init_pd_0[]; 340 extern const struct gf100_gr_init gf100_gr_init_ds_0[]; 341 extern const struct gf100_gr_init gf100_gr_init_scc_0[]; 342 extern const struct gf100_gr_init gf100_gr_init_prop_0[]; 343 extern const struct gf100_gr_init gf100_gr_init_gpc_unk_0[]; 344 extern const struct gf100_gr_init gf100_gr_init_setup_0[]; 345 extern const struct gf100_gr_init gf100_gr_init_crstr_0[]; 346 extern const struct gf100_gr_init gf100_gr_init_setup_1[]; 347 extern const struct gf100_gr_init gf100_gr_init_zcull_0[]; 348 extern const struct gf100_gr_init gf100_gr_init_gpm_0[]; 349 extern const struct gf100_gr_init gf100_gr_init_gpc_unk_1[]; 350 extern const struct gf100_gr_init gf100_gr_init_gcc_0[]; 351 extern const struct gf100_gr_init gf100_gr_init_tpccs_0[]; 352 extern const struct gf100_gr_init gf100_gr_init_tex_0[]; 353 extern const struct gf100_gr_init gf100_gr_init_pe_0[]; 354 extern const struct gf100_gr_init gf100_gr_init_l1c_0[]; 355 extern const struct gf100_gr_init gf100_gr_init_wwdx_0[]; 356 extern const struct gf100_gr_init gf100_gr_init_tpccs_1[]; 357 extern const struct gf100_gr_init gf100_gr_init_mpc_0[]; 358 extern const struct gf100_gr_init gf100_gr_init_be_0[]; 359 extern const struct gf100_gr_init gf100_gr_init_fe_1[]; 360 extern const struct gf100_gr_init gf100_gr_init_pe_1[]; 361 void gf100_gr_init_gpc_mmu(struct gf100_gr *); 362 void gf100_gr_trap_mp(struct gf100_gr *, int, int); 363 extern const struct nvkm_bitfield gf100_mp_global_error[]; 364 extern const struct nvkm_enum gf100_mp_warp_error[]; 365 366 extern const struct gf100_gr_init gf104_gr_init_ds_0[]; 367 extern const struct gf100_gr_init gf104_gr_init_tex_0[]; 368 extern const struct gf100_gr_init gf104_gr_init_sm_0[]; 369 370 extern const struct gf100_gr_init gf108_gr_init_gpc_unk_0[]; 371 extern const struct gf100_gr_init gf108_gr_init_setup_1[]; 372 373 extern const struct gf100_gr_init gf119_gr_init_pd_0[]; 374 extern const struct gf100_gr_init gf119_gr_init_ds_0[]; 375 extern const struct gf100_gr_init gf119_gr_init_prop_0[]; 376 extern const struct gf100_gr_init gf119_gr_init_gpm_0[]; 377 extern const struct gf100_gr_init gf119_gr_init_gpc_unk_1[]; 378 extern const struct gf100_gr_init gf119_gr_init_tex_0[]; 379 extern const struct gf100_gr_init gf119_gr_init_sm_0[]; 380 extern const struct gf100_gr_init gf119_gr_init_fe_1[]; 381 382 extern const struct gf100_gr_init gf117_gr_init_pes_0[]; 383 extern const struct gf100_gr_init gf117_gr_init_wwdx_0[]; 384 extern const struct gf100_gr_init gf117_gr_init_cbm_0[]; 385 386 extern const struct gf100_gr_init gk104_gr_init_main_0[]; 387 extern const struct gf100_gr_init gk104_gr_init_gpc_unk_2[]; 388 extern const struct gf100_gr_init gk104_gr_init_tpccs_0[]; 389 extern const struct gf100_gr_init gk104_gr_init_pe_0[]; 390 extern const struct gf100_gr_init gk104_gr_init_be_0[]; 391 extern const struct gf100_gr_pack gk104_gr_pack_mmio[]; 392 393 extern const struct gf100_gr_init gk110_gr_init_fe_0[]; 394 extern const struct gf100_gr_init gk110_gr_init_ds_0[]; 395 extern const struct gf100_gr_init gk110_gr_init_sked_0[]; 396 extern const struct gf100_gr_init gk110_gr_init_cwd_0[]; 397 extern const struct gf100_gr_init gk110_gr_init_gpc_unk_1[]; 398 extern const struct gf100_gr_init gk110_gr_init_tex_0[]; 399 extern const struct gf100_gr_init gk110_gr_init_sm_0[]; 400 401 extern const struct gf100_gr_init gk208_gr_init_gpc_unk_0[]; 402 403 extern const struct gf100_gr_init gm107_gr_init_scc_0[]; 404 extern const struct gf100_gr_init gm107_gr_init_prop_0[]; 405 extern const struct gf100_gr_init gm107_gr_init_setup_1[]; 406 extern const struct gf100_gr_init gm107_gr_init_zcull_0[]; 407 extern const struct gf100_gr_init gm107_gr_init_gpc_unk_1[]; 408 extern const struct gf100_gr_init gm107_gr_init_tex_0[]; 409 extern const struct gf100_gr_init gm107_gr_init_l1c_0[]; 410 extern const struct gf100_gr_init gm107_gr_init_wwdx_0[]; 411 extern const struct gf100_gr_init gm107_gr_init_cbm_0[]; 412 void gm107_gr_init_bios(struct gf100_gr *); 413 414 void gm200_gr_init_gpc_mmu(struct gf100_gr *); 415 416 struct gf100_gr_fwif { 417 int version; 418 int (*load)(struct gf100_gr *, int ver, const struct gf100_gr_fwif *); 419 const struct gf100_gr_func *func; 420 const struct nvkm_acr_lsf_func *fecs; 421 const struct nvkm_acr_lsf_func *gpccs; 422 }; 423 424 int gf100_gr_load(struct gf100_gr *, int, const struct gf100_gr_fwif *); 425 int gf100_gr_nofw(struct gf100_gr *, int, const struct gf100_gr_fwif *); 426 427 int gk20a_gr_load_sw(struct gf100_gr *, const char *path, int ver); 428 int gk20a_gr_load_net(struct gf100_gr *, const char *, const char *, int, 429 int (*)(struct nvkm_blob *, struct gf100_gr_pack **), 430 struct gf100_gr_pack **); 431 432 int gm200_gr_nofw(struct gf100_gr *, int, const struct gf100_gr_fwif *); 433 int gm200_gr_load(struct gf100_gr *, int, const struct gf100_gr_fwif *); 434 extern const struct nvkm_acr_lsf_func gm200_gr_gpccs_acr; 435 extern const struct nvkm_acr_lsf_func gm200_gr_fecs_acr; 436 437 extern const struct nvkm_acr_lsf_func gm20b_gr_fecs_acr; 438 void gm20b_gr_acr_bld_write(struct nvkm_acr *, u32, struct nvkm_acr_lsfw *); 439 void gm20b_gr_acr_bld_patch(struct nvkm_acr *, u32, s64); 440 441 extern const struct nvkm_acr_lsf_func gp108_gr_gpccs_acr; 442 extern const struct nvkm_acr_lsf_func gp108_gr_fecs_acr; 443 void gp108_gr_acr_bld_write(struct nvkm_acr *, u32, struct nvkm_acr_lsfw *); 444 void gp108_gr_acr_bld_patch(struct nvkm_acr *, u32, s64); 445 446 int gf100_gr_new_(const struct gf100_gr_fwif *, struct nvkm_device *, enum nvkm_subdev_type, int, 447 struct nvkm_gr **); 448 int r535_gr_new(const struct gf100_gr_func *, struct nvkm_device *, enum nvkm_subdev_type, int, 449 struct nvkm_gr **); 450 #endif 451