1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22#include "gk104.h"
23#include "cgrp.h"
24#include "changk104.h"
25#include "user.h"
26
27#include <core/client.h>
28#include <core/gpuobj.h>
29#include <subdev/bar.h>
30#include <subdev/fault.h>
31#include <subdev/top.h>
32#include <subdev/timer.h>
33#include <engine/sw.h>
34
35#include <nvif/class.h>
36
37static void
38tu102_fifo_runlist_commit(struct gk104_fifo *fifo, int runl,
39 struct nvkm_memory *mem, int nr)
40{
41 struct nvkm_device *device = fifo->base.engine.subdev.device;
42 u64 addr = nvkm_memory_addr(mem);
43
44
45 nvkm_wr32(device, 0x002b00 + (runl * 0x10), lower_32_bits(addr));
46 nvkm_wr32(device, 0x002b04 + (runl * 0x10), upper_32_bits(addr));
47 nvkm_wr32(device, 0x002b08 + (runl * 0x10), nr);
48
49
50}
51
52const struct gk104_fifo_runlist_func
53tu102_fifo_runlist = {
54 .size = 16,
55 .cgrp = gv100_fifo_runlist_cgrp,
56 .chan = gv100_fifo_runlist_chan,
57 .commit = tu102_fifo_runlist_commit,
58};
59
60static const struct nvkm_enum
61tu102_fifo_fault_engine[] = {
62 { 0x01, "DISPLAY" },
63 { 0x03, "PTP" },
64 { 0x06, "PWR_PMU" },
65 { 0x08, "IFB", NULL, NVKM_ENGINE_IFB },
66 { 0x09, "PERF" },
67 { 0x1f, "PHYSICAL" },
68 { 0x20, "HOST0" },
69 { 0x21, "HOST1" },
70 { 0x22, "HOST2" },
71 { 0x23, "HOST3" },
72 { 0x24, "HOST4" },
73 { 0x25, "HOST5" },
74 { 0x26, "HOST6" },
75 { 0x27, "HOST7" },
76 { 0x28, "HOST8" },
77 { 0x29, "HOST9" },
78 { 0x2a, "HOST10" },
79 { 0x2b, "HOST11" },
80 { 0x2c, "HOST12" },
81 { 0x2d, "HOST13" },
82 { 0x2e, "HOST14" },
83 { 0x80, "BAR1", NULL, NVKM_SUBDEV_BAR },
84 { 0xc0, "BAR2", NULL, NVKM_SUBDEV_INSTMEM },
85 {}
86};
87
88static void
89tu102_fifo_pbdma_init(struct gk104_fifo *fifo)
90{
91 struct nvkm_device *device = fifo->base.engine.subdev.device;
92 const u32 mask = (1 << fifo->pbdma_nr) - 1;
93
94 nvkm_mask(device, 0xb65000, 0x80000fff, 0x80000000 | mask);
95}
96
97static const struct gk104_fifo_pbdma_func
98tu102_fifo_pbdma = {
99 .nr = gm200_fifo_pbdma_nr,
100 .init = tu102_fifo_pbdma_init,
101 .init_timeout = gk208_fifo_pbdma_init_timeout,
102};
103
104static const struct gk104_fifo_func
105tu102_fifo = {
106 .pbdma = &tu102_fifo_pbdma,
107 .fault.access = gv100_fifo_fault_access,
108 .fault.engine = tu102_fifo_fault_engine,
109 .fault.reason = gv100_fifo_fault_reason,
110 .fault.hubclient = gv100_fifo_fault_hubclient,
111 .fault.gpcclient = gv100_fifo_fault_gpcclient,
112 .runlist = &tu102_fifo_runlist,
113 .user = {{-1,-1,VOLTA_USERMODE_A }, tu102_fifo_user_new },
114 .chan = {{ 0, 0,TURING_CHANNEL_GPFIFO_A}, tu102_fifo_gpfifo_new },
115 .cgrp_force = true,
116};
117
118static void
119tu102_fifo_recover_work(struct work_struct *w)
120{
121 struct gk104_fifo *fifo = container_of(w, typeof(*fifo), recover.work);
122 struct nvkm_device *device = fifo->base.engine.subdev.device;
123 struct nvkm_engine *engine;
124 unsigned long flags;
125 u32 engm, runm, todo;
126 int engn, runl;
127
128 spin_lock_irqsave(&fifo->base.lock, flags);
129 runm = fifo->recover.runm;
130 engm = fifo->recover.engm;
131 fifo->recover.engm = 0;
132 fifo->recover.runm = 0;
133 spin_unlock_irqrestore(&fifo->base.lock, flags);
134
135 nvkm_mask(device, 0x002630, runm, runm);
136
137 for (todo = engm; engn = __ffs(todo), todo; todo &= ~BIT(engn)) {
138 if ((engine = fifo->engine[engn].engine)) {
139 nvkm_subdev_fini(&engine->subdev, false);
140 WARN_ON(nvkm_subdev_init(&engine->subdev));
141 }
142 }
143
144 for (todo = runm; runl = __ffs(todo), todo; todo &= ~BIT(runl))
145 gk104_fifo_runlist_update(fifo, runl);
146
147 nvkm_mask(device, 0x002630, runm, 0x00000000);
148}
149
150static void tu102_fifo_recover_engn(struct gk104_fifo *fifo, int engn);
151
152static void
153tu102_fifo_recover_runl(struct gk104_fifo *fifo, int runl)
154{
155 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
156 struct nvkm_device *device = subdev->device;
157 const u32 runm = BIT(runl);
158
159 assert_spin_locked(&fifo->base.lock);
160 if (fifo->recover.runm & runm)
161 return;
162 fifo->recover.runm |= runm;
163
164
165 nvkm_mask(device, 0x002630, runm, runm);
166
167
168 nvkm_warn(subdev, "runlist %d: scheduled for recovery\n", runl);
169 schedule_work(&fifo->recover.work);
170}
171
172static struct gk104_fifo_chan *
173tu102_fifo_recover_chid(struct gk104_fifo *fifo, int runl, int chid)
174{
175 struct gk104_fifo_chan *chan;
176 struct nvkm_fifo_cgrp *cgrp;
177
178 list_for_each_entry(chan, &fifo->runlist[runl].chan, head) {
179 if (chan->base.chid == chid) {
180 list_del_init(&chan->head);
181 return chan;
182 }
183 }
184
185 list_for_each_entry(cgrp, &fifo->runlist[runl].cgrp, head) {
186 if (cgrp->id == chid) {
187 chan = list_first_entry(&cgrp->chan, typeof(*chan), head);
188 list_del_init(&chan->head);
189 if (!--cgrp->chan_nr)
190 list_del_init(&cgrp->head);
191 return chan;
192 }
193 }
194
195 return NULL;
196}
197
198static void
199tu102_fifo_recover_chan(struct nvkm_fifo *base, int chid)
200{
201 struct gk104_fifo *fifo = gk104_fifo(base);
202 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
203 struct nvkm_device *device = subdev->device;
204 const u32 stat = nvkm_rd32(device, 0x800004 + (chid * 0x08));
205 const u32 runl = (stat & 0x000f0000) >> 16;
206 const bool used = (stat & 0x00000001);
207 unsigned long engn, engm = fifo->runlist[runl].engm;
208 struct gk104_fifo_chan *chan;
209
210 assert_spin_locked(&fifo->base.lock);
211 if (!used)
212 return;
213
214
215 chan = tu102_fifo_recover_chid(fifo, runl, chid);
216 if (chan) {
217 chan->killed = true;
218 nvkm_fifo_kevent(&fifo->base, chid);
219 }
220
221
222 nvkm_wr32(device, 0x800004 + (chid * 0x08), stat | 0x00000800);
223 nvkm_warn(subdev, "channel %d: killed\n", chid);
224
225
226 tu102_fifo_recover_runl(fifo, runl);
227
228
229 for_each_set_bit(engn, &engm, fifo->engine_nr) {
230 struct gk104_fifo_engine_status status;
231
232 gk104_fifo_engine_status(fifo, engn, &status);
233 if (!status.chan || status.chan->id != chid)
234 continue;
235 tu102_fifo_recover_engn(fifo, engn);
236 }
237}
238
239static void
240tu102_fifo_recover_engn(struct gk104_fifo *fifo, int engn)
241{
242 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
243 struct nvkm_device *device = subdev->device;
244 const u32 runl = fifo->engine[engn].runl;
245 const u32 engm = BIT(engn);
246 struct gk104_fifo_engine_status status;
247
248 assert_spin_locked(&fifo->base.lock);
249 if (fifo->recover.engm & engm)
250 return;
251 fifo->recover.engm |= engm;
252
253
254 tu102_fifo_recover_runl(fifo, runl);
255
256
257 gk104_fifo_engine_status(fifo, engn, &status);
258 if (status.chan) {
259
260 tu102_fifo_recover_chan(&fifo->base, status.chan->id);
261 }
262
263
264 nvkm_wr32(device, 0x2638, BIT(runl));
265
266
267 nvkm_warn(subdev, "engine %d: scheduled for recovery\n", engn);
268 schedule_work(&fifo->recover.work);
269}
270
271static void
272tu102_fifo_fault(struct nvkm_fifo *base, struct nvkm_fault_data *info)
273{
274 struct gk104_fifo *fifo = gk104_fifo(base);
275 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
276 struct nvkm_device *device = subdev->device;
277 const struct nvkm_enum *er, *ee, *ec, *ea;
278 struct nvkm_engine *engine = NULL;
279 struct nvkm_fifo_chan *chan;
280 unsigned long flags;
281 const char *en = "";
282 char ct[8] = "HUB/";
283 int engn;
284
285 er = nvkm_enum_find(fifo->func->fault.reason, info->reason);
286 ee = nvkm_enum_find(fifo->func->fault.engine, info->engine);
287 if (info->hub) {
288 ec = nvkm_enum_find(fifo->func->fault.hubclient, info->client);
289 } else {
290 ec = nvkm_enum_find(fifo->func->fault.gpcclient, info->client);
291 snprintf(ct, sizeof(ct), "GPC%d/", info->gpc);
292 }
293 ea = nvkm_enum_find(fifo->func->fault.access, info->access);
294
295 if (ee && ee->data2) {
296 switch (ee->data2) {
297 case NVKM_SUBDEV_BAR:
298 nvkm_bar_bar1_reset(device);
299 break;
300 case NVKM_SUBDEV_INSTMEM:
301 nvkm_bar_bar2_reset(device);
302 break;
303 case NVKM_ENGINE_IFB:
304 nvkm_mask(device, 0x001718, 0x00000000, 0x00000000);
305 break;
306 default:
307 engine = nvkm_device_engine(device, ee->data2, 0);
308 break;
309 }
310 }
311
312 if (ee == NULL) {
313 struct nvkm_subdev *subdev = nvkm_top_fault(device, info->engine);
314 if (subdev) {
315 if (subdev->func == &nvkm_engine)
316 engine = container_of(subdev, typeof(*engine), subdev);
317 en = engine->subdev.name;
318 }
319 } else {
320 en = ee->name;
321 }
322
323 spin_lock_irqsave(&fifo->base.lock, flags);
324 chan = nvkm_fifo_chan_inst_locked(&fifo->base, info->inst);
325
326 nvkm_error(subdev,
327 "fault %02x [%s] at %016llx engine %02x [%s] client %02x "
328 "[%s%s] reason %02x [%s] on channel %d [%010llx %s]\n",
329 info->access, ea ? ea->name : "", info->addr,
330 info->engine, ee ? ee->name : en,
331 info->client, ct, ec ? ec->name : "",
332 info->reason, er ? er->name : "", chan ? chan->chid : -1,
333 info->inst, chan ? chan->object.client->name : "unknown");
334
335
336 if (chan)
337 tu102_fifo_recover_chan(&fifo->base, chan->chid);
338
339
340
341
342
343 for (engn = 0; engn < fifo->engine_nr && engine; engn++) {
344 if (fifo->engine[engn].engine == engine) {
345 tu102_fifo_recover_engn(fifo, engn);
346 break;
347 }
348 }
349
350 spin_unlock_irqrestore(&fifo->base.lock, flags);
351}
352
353static void
354tu102_fifo_intr_ctxsw_timeout(struct gk104_fifo *fifo)
355{
356 struct nvkm_device *device = fifo->base.engine.subdev.device;
357 unsigned long flags, engm;
358 u32 engn;
359
360 spin_lock_irqsave(&fifo->base.lock, flags);
361
362 engm = nvkm_rd32(device, 0x2a30);
363 nvkm_wr32(device, 0x2a30, engm);
364
365 for_each_set_bit(engn, &engm, 32)
366 tu102_fifo_recover_engn(fifo, engn);
367
368 spin_unlock_irqrestore(&fifo->base.lock, flags);
369}
370
371static void
372tu102_fifo_intr_sched(struct gk104_fifo *fifo)
373{
374 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
375 struct nvkm_device *device = subdev->device;
376 u32 intr = nvkm_rd32(device, 0x00254c);
377 u32 code = intr & 0x000000ff;
378
379 nvkm_error(subdev, "SCHED_ERROR %02x\n", code);
380}
381
382static void
383tu102_fifo_intr(struct nvkm_fifo *base)
384{
385 struct gk104_fifo *fifo = gk104_fifo(base);
386 struct nvkm_subdev *subdev = &fifo->base.engine.subdev;
387 struct nvkm_device *device = subdev->device;
388 u32 mask = nvkm_rd32(device, 0x002140);
389 u32 stat = nvkm_rd32(device, 0x002100) & mask;
390
391 if (stat & 0x00000001) {
392 gk104_fifo_intr_bind(fifo);
393 nvkm_wr32(device, 0x002100, 0x00000001);
394 stat &= ~0x00000001;
395 }
396
397 if (stat & 0x00000002) {
398 tu102_fifo_intr_ctxsw_timeout(fifo);
399 stat &= ~0x00000002;
400 }
401
402 if (stat & 0x00000100) {
403 tu102_fifo_intr_sched(fifo);
404 nvkm_wr32(device, 0x002100, 0x00000100);
405 stat &= ~0x00000100;
406 }
407
408 if (stat & 0x00010000) {
409 gk104_fifo_intr_chsw(fifo);
410 nvkm_wr32(device, 0x002100, 0x00010000);
411 stat &= ~0x00010000;
412 }
413
414 if (stat & 0x20000000) {
415 u32 mask = nvkm_rd32(device, 0x0025a0);
416
417 while (mask) {
418 u32 unit = __ffs(mask);
419
420 gk104_fifo_intr_pbdma_0(fifo, unit);
421 gk104_fifo_intr_pbdma_1(fifo, unit);
422 nvkm_wr32(device, 0x0025a0, (1 << unit));
423 mask &= ~(1 << unit);
424 }
425 stat &= ~0x20000000;
426 }
427
428 if (stat & 0x40000000) {
429 gk104_fifo_intr_runlist(fifo);
430 stat &= ~0x40000000;
431 }
432
433 if (stat & 0x80000000) {
434 nvkm_wr32(device, 0x002100, 0x80000000);
435 gk104_fifo_intr_engine(fifo);
436 stat &= ~0x80000000;
437 }
438
439 if (stat) {
440 nvkm_error(subdev, "INTR %08x\n", stat);
441 nvkm_mask(device, 0x002140, stat, 0x00000000);
442 nvkm_wr32(device, 0x002100, stat);
443 }
444}
445
446static const struct nvkm_fifo_func
447tu102_fifo_ = {
448 .dtor = gk104_fifo_dtor,
449 .oneinit = gk104_fifo_oneinit,
450 .info = gk104_fifo_info,
451 .init = gk104_fifo_init,
452 .fini = gk104_fifo_fini,
453 .intr = tu102_fifo_intr,
454 .fault = tu102_fifo_fault,
455 .engine_id = gk104_fifo_engine_id,
456 .id_engine = gk104_fifo_id_engine,
457 .uevent_init = gk104_fifo_uevent_init,
458 .uevent_fini = gk104_fifo_uevent_fini,
459 .recover_chan = tu102_fifo_recover_chan,
460 .class_get = gk104_fifo_class_get,
461 .class_new = gk104_fifo_class_new,
462};
463
464int
465tu102_fifo_new(struct nvkm_device *device, enum nvkm_subdev_type type, int inst,
466 struct nvkm_fifo **pfifo)
467{
468 struct gk104_fifo *fifo;
469
470 if (!(fifo = kzalloc(sizeof(*fifo), GFP_KERNEL)))
471 return -ENOMEM;
472 fifo->func = &tu102_fifo;
473 INIT_WORK(&fifo->recover.work, tu102_fifo_recover_work);
474 *pfifo = &fifo->base;
475
476 return nvkm_fifo_ctor(&tu102_fifo_, device, type, inst, 4096, &fifo->base);
477}
478