.. | .. |
---|
23 | 23 | #define REG_READ(offset) _REG_READ(rknpu_core_base, offset) |
---|
24 | 24 | #define REG_WRITE(value, offset) _REG_WRITE(rknpu_core_base, value, offset) |
---|
25 | 25 | |
---|
26 | | -static int rknpu_core_index(int core_mask) |
---|
| 26 | +static int rknpu_wait_core_index(int core_mask) |
---|
27 | 27 | { |
---|
28 | 28 | int index = 0; |
---|
29 | 29 | |
---|
30 | | - if (core_mask & RKNPU_CORE0_MASK) |
---|
| 30 | + switch (core_mask & ((1 << RKNPU_MAX_CORES) - 1)) { |
---|
| 31 | + case RKNPU_CORE0_MASK: |
---|
| 32 | + case RKNPU_CORE0_MASK | RKNPU_CORE1_MASK: |
---|
| 33 | + case RKNPU_CORE0_MASK | RKNPU_CORE1_MASK | RKNPU_CORE2_MASK: |
---|
31 | 34 | index = 0; |
---|
32 | | - else if (core_mask & RKNPU_CORE1_MASK) |
---|
| 35 | + break; |
---|
| 36 | + case RKNPU_CORE1_MASK: |
---|
33 | 37 | index = 1; |
---|
34 | | - else if (core_mask & RKNPU_CORE2_MASK) |
---|
| 38 | + break; |
---|
| 39 | + case RKNPU_CORE2_MASK: |
---|
35 | 40 | index = 2; |
---|
| 41 | + break; |
---|
| 42 | + default: |
---|
| 43 | + break; |
---|
| 44 | + } |
---|
36 | 45 | |
---|
37 | 46 | return index; |
---|
38 | 47 | } |
---|
.. | .. |
---|
58 | 67 | return core_mask; |
---|
59 | 68 | } |
---|
60 | 69 | |
---|
61 | | -static int rknn_get_task_number(struct rknpu_job *job, int core_index) |
---|
| 70 | +static int rknpu_get_task_number(struct rknpu_job *job, int core_index) |
---|
62 | 71 | { |
---|
| 72 | + struct rknpu_device *rknpu_dev = job->rknpu_dev; |
---|
63 | 73 | int task_num = job->args->task_number; |
---|
64 | 74 | |
---|
65 | | - if (job->use_core_num == 2) |
---|
66 | | - task_num = job->args->subcore_task[core_index].task_number; |
---|
67 | | - else if (job->use_core_num == 3) |
---|
68 | | - task_num = job->args->subcore_task[core_index + 2].task_number; |
---|
| 75 | + if (core_index >= RKNPU_MAX_CORES || core_index < 0) { |
---|
| 76 | + LOG_ERROR("core_index: %d set error!", core_index); |
---|
| 77 | + return 0; |
---|
| 78 | + } |
---|
| 79 | + |
---|
| 80 | + if (rknpu_dev->config->num_irqs > 1) { |
---|
| 81 | + if (job->use_core_num == 1 || job->use_core_num == 2) |
---|
| 82 | + task_num = |
---|
| 83 | + job->args->subcore_task[core_index].task_number; |
---|
| 84 | + else if (job->use_core_num == 3) |
---|
| 85 | + task_num = job->args->subcore_task[core_index + 2] |
---|
| 86 | + .task_number; |
---|
| 87 | + } |
---|
69 | 88 | |
---|
70 | 89 | return task_num; |
---|
71 | 90 | } |
---|
.. | .. |
---|
124 | 143 | job->use_core_num = (args->core_mask & RKNPU_CORE0_MASK) + |
---|
125 | 144 | ((args->core_mask & RKNPU_CORE1_MASK) >> 1) + |
---|
126 | 145 | ((args->core_mask & RKNPU_CORE2_MASK) >> 2); |
---|
127 | | - job->run_count = job->use_core_num; |
---|
128 | | - job->interrupt_count = job->use_core_num; |
---|
| 146 | + atomic_set(&job->run_count, job->use_core_num); |
---|
| 147 | + atomic_set(&job->interrupt_count, job->use_core_num); |
---|
129 | 148 | #ifdef CONFIG_ROCKCHIP_RKNPU_DRM_GEM |
---|
130 | 149 | task_obj = (struct rknpu_gem_object *)(uintptr_t)args->task_obj_addr; |
---|
131 | 150 | if (task_obj) |
---|
.. | .. |
---|
157 | 176 | struct rknpu_submit *args = job->args; |
---|
158 | 177 | struct rknpu_task *last_task = NULL; |
---|
159 | 178 | struct rknpu_subcore_data *subcore_data = NULL; |
---|
| 179 | + struct rknpu_job *entry, *q; |
---|
160 | 180 | void __iomem *rknpu_core_base = NULL; |
---|
161 | | - int core_index = rknpu_core_index(job->args->core_mask); |
---|
| 181 | + int core_index = rknpu_wait_core_index(job->args->core_mask); |
---|
162 | 182 | unsigned long flags; |
---|
163 | 183 | int wait_count = 0; |
---|
| 184 | + bool continue_wait = false; |
---|
164 | 185 | int ret = -EINVAL; |
---|
| 186 | + int i = 0; |
---|
165 | 187 | |
---|
166 | 188 | subcore_data = &rknpu_dev->subcore_datas[core_index]; |
---|
167 | 189 | |
---|
.. | .. |
---|
170 | 192 | job->flags & RKNPU_JOB_DONE || |
---|
171 | 193 | rknpu_dev->soft_reseting, |
---|
172 | 194 | msecs_to_jiffies(args->timeout)); |
---|
| 195 | + |
---|
173 | 196 | if (++wait_count >= 3) |
---|
174 | 197 | break; |
---|
175 | | - } while (ret == 0 && job->in_queue[core_index]); |
---|
176 | 198 | |
---|
177 | | - if (job->in_queue[core_index]) { |
---|
178 | | - spin_lock_irqsave(&rknpu_dev->lock, flags); |
---|
179 | | - list_del_init(&job->head[core_index]); |
---|
180 | | - subcore_data->task_num -= rknn_get_task_number(job, core_index); |
---|
181 | | - job->in_queue[core_index] = false; |
---|
182 | | - spin_unlock_irqrestore(&rknpu_dev->lock, flags); |
---|
183 | | - return ret < 0 ? ret : -EINVAL; |
---|
184 | | - } |
---|
| 199 | + if (ret == 0) { |
---|
| 200 | + int64_t commit_time = 0; |
---|
| 201 | + spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
| 202 | + commit_time = ktime_us_delta(ktime_get(), |
---|
| 203 | + job->commit_pc_time); |
---|
| 204 | + continue_wait = |
---|
| 205 | + job->commit_pc_time == 0 ? |
---|
| 206 | + true : |
---|
| 207 | + (commit_time < args->timeout * 1000); |
---|
| 208 | + spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
| 209 | + LOG_ERROR( |
---|
| 210 | + "job: %p, wait_count: %d, continue_wait: %d, commit time: %lldus, wait time: %lldus, timeout time: %uus\n", |
---|
| 211 | + job, wait_count, continue_wait, |
---|
| 212 | + (job->commit_pc_time == 0 ? 0 : commit_time), |
---|
| 213 | + ktime_us_delta(ktime_get(), job->timestamp), |
---|
| 214 | + args->timeout * 1000); |
---|
| 215 | + } |
---|
| 216 | + } while (ret == 0 && continue_wait); |
---|
185 | 217 | |
---|
186 | 218 | last_task = job->last_task; |
---|
187 | | - if (!last_task) |
---|
| 219 | + if (!last_task) { |
---|
| 220 | + spin_lock_irqsave(&rknpu_dev->lock, flags); |
---|
| 221 | + for (i = 0; i < job->use_core_num; i++) { |
---|
| 222 | + subcore_data = &rknpu_dev->subcore_datas[i]; |
---|
| 223 | + list_for_each_entry_safe( |
---|
| 224 | + entry, q, &subcore_data->todo_list, head[i]) { |
---|
| 225 | + if (entry == job) { |
---|
| 226 | + list_del(&job->head[i]); |
---|
| 227 | + break; |
---|
| 228 | + } |
---|
| 229 | + } |
---|
| 230 | + } |
---|
| 231 | + spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
| 232 | + |
---|
| 233 | + LOG_ERROR("job commit failed\n"); |
---|
188 | 234 | return ret < 0 ? ret : -EINVAL; |
---|
| 235 | + } |
---|
189 | 236 | |
---|
190 | 237 | last_task->int_status = job->int_status[core_index]; |
---|
191 | 238 | |
---|
.. | .. |
---|
193 | 240 | args->task_counter = 0; |
---|
194 | 241 | rknpu_core_base = rknpu_dev->base[core_index]; |
---|
195 | 242 | if (args->flags & RKNPU_JOB_PC) { |
---|
196 | | - uint32_t task_status = |
---|
197 | | - REG_READ(RKNPU_OFFSET_PC_TASK_STATUS); |
---|
| 243 | + uint32_t task_status = REG_READ( |
---|
| 244 | + rknpu_dev->config->pc_task_status_offset); |
---|
198 | 245 | args->task_counter = |
---|
199 | 246 | (task_status & |
---|
200 | 247 | rknpu_dev->config->pc_task_number_mask); |
---|
.. | .. |
---|
203 | 250 | LOG_ERROR( |
---|
204 | 251 | "failed to wait job, task counter: %d, flags: %#x, ret = %d, elapsed time: %lldus\n", |
---|
205 | 252 | args->task_counter, args->flags, ret, |
---|
206 | | - ktime_to_us(ktime_sub(ktime_get(), job->timestamp))); |
---|
| 253 | + ktime_us_delta(ktime_get(), job->timestamp)); |
---|
207 | 254 | |
---|
208 | 255 | return ret < 0 ? ret : -ETIMEDOUT; |
---|
209 | 256 | } |
---|
.. | .. |
---|
216 | 263 | return 0; |
---|
217 | 264 | } |
---|
218 | 265 | |
---|
219 | | -static inline int rknpu_job_commit_pc(struct rknpu_job *job, int core_index) |
---|
| 266 | +static inline int rknpu_job_subcore_commit_pc(struct rknpu_job *job, |
---|
| 267 | + int core_index) |
---|
220 | 268 | { |
---|
221 | 269 | struct rknpu_device *rknpu_dev = job->rknpu_dev; |
---|
222 | 270 | struct rknpu_submit *args = job->args; |
---|
.. | .. |
---|
233 | 281 | struct rknpu_task *last_task = NULL; |
---|
234 | 282 | void __iomem *rknpu_core_base = rknpu_dev->base[core_index]; |
---|
235 | 283 | int task_start = args->task_start; |
---|
236 | | - int task_end = args->task_start + args->task_number - 1; |
---|
| 284 | + int task_end; |
---|
237 | 285 | int task_number = args->task_number; |
---|
238 | 286 | int task_pp_en = args->flags & RKNPU_JOB_PINGPONG ? 1 : 0; |
---|
239 | 287 | int pc_data_amount_scale = rknpu_dev->config->pc_data_amount_scale; |
---|
240 | 288 | int pc_task_number_bits = rknpu_dev->config->pc_task_number_bits; |
---|
241 | 289 | int i = 0; |
---|
| 290 | + int submit_index = atomic_read(&job->submit_count[core_index]); |
---|
| 291 | + int max_submit_number = rknpu_dev->config->max_submit_number; |
---|
242 | 292 | |
---|
243 | | - if (!task_obj) |
---|
244 | | - return -EINVAL; |
---|
| 293 | + if (!task_obj) { |
---|
| 294 | + job->ret = -EINVAL; |
---|
| 295 | + return job->ret; |
---|
| 296 | + } |
---|
245 | 297 | |
---|
246 | 298 | if (rknpu_dev->config->num_irqs > 1) { |
---|
247 | 299 | for (i = 0; i < rknpu_dev->config->num_irqs; i++) { |
---|
.. | .. |
---|
251 | 303 | } |
---|
252 | 304 | } |
---|
253 | 305 | |
---|
254 | | - if (job->use_core_num == 1) { |
---|
| 306 | + switch (job->use_core_num) { |
---|
| 307 | + case 1: |
---|
| 308 | + case 2: |
---|
255 | 309 | task_start = args->subcore_task[core_index].task_start; |
---|
256 | | - task_end = args->subcore_task[core_index].task_start + |
---|
257 | | - args->subcore_task[core_index].task_number - |
---|
258 | | - 1; |
---|
259 | 310 | task_number = |
---|
260 | 311 | args->subcore_task[core_index].task_number; |
---|
261 | | - } else if (job->use_core_num == 2) { |
---|
262 | | - task_start = args->subcore_task[core_index].task_start; |
---|
263 | | - task_end = args->subcore_task[core_index].task_start + |
---|
264 | | - args->subcore_task[core_index].task_number - |
---|
265 | | - 1; |
---|
266 | | - task_number = |
---|
267 | | - args->subcore_task[core_index].task_number; |
---|
268 | | - } else if (job->use_core_num == 3) { |
---|
| 312 | + break; |
---|
| 313 | + case 3: |
---|
269 | 314 | task_start = |
---|
270 | 315 | args->subcore_task[core_index + 2].task_start; |
---|
271 | | - task_end = |
---|
272 | | - args->subcore_task[core_index + 2].task_start + |
---|
273 | | - args->subcore_task[core_index + 2].task_number - |
---|
274 | | - 1; |
---|
275 | 316 | task_number = |
---|
276 | 317 | args->subcore_task[core_index + 2].task_number; |
---|
| 318 | + break; |
---|
| 319 | + default: |
---|
| 320 | + LOG_ERROR("Unknown use core num %d\n", |
---|
| 321 | + job->use_core_num); |
---|
| 322 | + break; |
---|
277 | 323 | } |
---|
278 | 324 | } |
---|
| 325 | + |
---|
| 326 | + task_start = task_start + submit_index * max_submit_number; |
---|
| 327 | + task_number = task_number - submit_index * max_submit_number; |
---|
| 328 | + task_number = task_number > max_submit_number ? max_submit_number : |
---|
| 329 | + task_number; |
---|
| 330 | + task_end = task_start + task_number - 1; |
---|
279 | 331 | |
---|
280 | 332 | task_base = task_obj->kv_addr; |
---|
281 | 333 | |
---|
282 | 334 | first_task = &task_base[task_start]; |
---|
283 | 335 | last_task = &task_base[task_end]; |
---|
284 | 336 | |
---|
| 337 | + spin_lock(&rknpu_dev->lock); |
---|
285 | 338 | REG_WRITE(first_task->regcmd_addr, RKNPU_OFFSET_PC_DATA_ADDR); |
---|
| 339 | + spin_unlock(&rknpu_dev->lock); |
---|
286 | 340 | |
---|
287 | 341 | REG_WRITE((first_task->regcfg_amount + RKNPU_PC_DATA_EXTRA_AMOUNT + |
---|
288 | 342 | pc_data_amount_scale - 1) / |
---|
.. | .. |
---|
309 | 363 | return 0; |
---|
310 | 364 | } |
---|
311 | 365 | |
---|
312 | | -static int rknpu_job_commit(struct rknpu_job *job, int core_index) |
---|
| 366 | +static inline int rknpu_job_subcore_commit(struct rknpu_job *job, int core_index) |
---|
313 | 367 | { |
---|
314 | 368 | struct rknpu_device *rknpu_dev = job->rknpu_dev; |
---|
315 | 369 | struct rknpu_submit *args = job->args; |
---|
316 | 370 | void __iomem *rknpu_core_base = rknpu_dev->base[core_index]; |
---|
317 | 371 | |
---|
318 | 372 | // switch to slave mode |
---|
| 373 | + spin_lock(&rknpu_dev->lock); |
---|
319 | 374 | REG_WRITE(0x1, RKNPU_OFFSET_PC_DATA_ADDR); |
---|
| 375 | + spin_unlock(&rknpu_dev->lock); |
---|
320 | 376 | |
---|
321 | | - if (!(args->flags & RKNPU_JOB_PC)) |
---|
322 | | - return -EINVAL; |
---|
| 377 | + if (!(args->flags & RKNPU_JOB_PC)) { |
---|
| 378 | + job->ret = -EINVAL; |
---|
| 379 | + return job->ret; |
---|
| 380 | + } |
---|
323 | 381 | |
---|
324 | | - return rknpu_job_commit_pc(job, core_index); |
---|
| 382 | + return rknpu_job_subcore_commit_pc(job, core_index); |
---|
| 383 | +} |
---|
| 384 | + |
---|
| 385 | +static void rknpu_job_commit(struct rknpu_job *job) |
---|
| 386 | +{ |
---|
| 387 | + switch (job->args->core_mask & ((1 << RKNPU_MAX_CORES) - 1)) { |
---|
| 388 | + case RKNPU_CORE0_MASK: |
---|
| 389 | + rknpu_job_subcore_commit(job, 0); |
---|
| 390 | + break; |
---|
| 391 | + case RKNPU_CORE1_MASK: |
---|
| 392 | + rknpu_job_subcore_commit(job, 1); |
---|
| 393 | + break; |
---|
| 394 | + case RKNPU_CORE2_MASK: |
---|
| 395 | + rknpu_job_subcore_commit(job, 2); |
---|
| 396 | + break; |
---|
| 397 | + case RKNPU_CORE0_MASK | RKNPU_CORE1_MASK: |
---|
| 398 | + rknpu_job_subcore_commit(job, 0); |
---|
| 399 | + rknpu_job_subcore_commit(job, 1); |
---|
| 400 | + break; |
---|
| 401 | + case RKNPU_CORE0_MASK | RKNPU_CORE1_MASK | RKNPU_CORE2_MASK: |
---|
| 402 | + rknpu_job_subcore_commit(job, 0); |
---|
| 403 | + rknpu_job_subcore_commit(job, 1); |
---|
| 404 | + rknpu_job_subcore_commit(job, 2); |
---|
| 405 | + break; |
---|
| 406 | + default: |
---|
| 407 | + LOG_ERROR("Unknown core mask: %d\n", job->args->core_mask); |
---|
| 408 | + break; |
---|
| 409 | + } |
---|
325 | 410 | } |
---|
326 | 411 | |
---|
327 | 412 | static void rknpu_job_next(struct rknpu_device *rknpu_dev, int core_index) |
---|
.. | .. |
---|
346 | 431 | head[core_index]); |
---|
347 | 432 | |
---|
348 | 433 | list_del_init(&job->head[core_index]); |
---|
349 | | - job->in_queue[core_index] = false; |
---|
350 | 434 | subcore_data->job = job; |
---|
351 | | - job->run_count--; |
---|
352 | 435 | job->hw_recoder_time = ktime_get(); |
---|
| 436 | + job->commit_pc_time = job->hw_recoder_time; |
---|
353 | 437 | spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
354 | 438 | |
---|
355 | | - if (job->run_count == 0) { |
---|
356 | | - if (job->args->core_mask & RKNPU_CORE0_MASK) |
---|
357 | | - job->ret = rknpu_job_commit(job, 0); |
---|
358 | | - if (job->args->core_mask & RKNPU_CORE1_MASK) |
---|
359 | | - job->ret = rknpu_job_commit(job, 1); |
---|
360 | | - if (job->args->core_mask & RKNPU_CORE2_MASK) |
---|
361 | | - job->ret = rknpu_job_commit(job, 2); |
---|
| 439 | + if (atomic_dec_and_test(&job->run_count)) { |
---|
| 440 | + rknpu_job_commit(job); |
---|
362 | 441 | } |
---|
363 | 442 | } |
---|
364 | 443 | |
---|
.. | .. |
---|
367 | 446 | struct rknpu_device *rknpu_dev = job->rknpu_dev; |
---|
368 | 447 | struct rknpu_subcore_data *subcore_data = NULL; |
---|
369 | 448 | unsigned long flags; |
---|
370 | | - ktime_t now = ktime_get(); |
---|
| 449 | + int max_submit_number = rknpu_dev->config->max_submit_number; |
---|
| 450 | + |
---|
| 451 | + if (atomic_inc_return(&job->submit_count[core_index]) < |
---|
| 452 | + (rknpu_get_task_number(job, core_index) + max_submit_number - 1) / |
---|
| 453 | + max_submit_number) { |
---|
| 454 | + rknpu_job_commit(job); |
---|
| 455 | + return; |
---|
| 456 | + } |
---|
371 | 457 | |
---|
372 | 458 | subcore_data = &rknpu_dev->subcore_datas[core_index]; |
---|
373 | 459 | |
---|
374 | 460 | spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
375 | 461 | subcore_data->job = NULL; |
---|
376 | | - subcore_data->task_num -= rknn_get_task_number(job, core_index); |
---|
377 | | - job->interrupt_count--; |
---|
| 462 | + subcore_data->task_num -= rknpu_get_task_number(job, core_index); |
---|
378 | 463 | subcore_data->timer.busy_time += |
---|
379 | | - ktime_us_delta(now, job->hw_recoder_time); |
---|
| 464 | + ktime_us_delta(ktime_get(), job->hw_recoder_time); |
---|
380 | 465 | spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
381 | 466 | |
---|
382 | | - if (job->interrupt_count == 0) { |
---|
| 467 | + if (atomic_dec_and_test(&job->interrupt_count)) { |
---|
383 | 468 | int use_core_num = job->use_core_num; |
---|
384 | 469 | |
---|
385 | 470 | job->flags |= RKNPU_JOB_DONE; |
---|
.. | .. |
---|
409 | 494 | int task_num_list[3] = { 0, 1, 2 }; |
---|
410 | 495 | int tmp = 0; |
---|
411 | 496 | |
---|
412 | | - if ((job->args->core_mask & 0x07) == RKNPU_CORE_AUTO_MASK) { |
---|
| 497 | + if ((job->args->core_mask & ((1 << RKNPU_MAX_CORES) - 1)) == |
---|
| 498 | + RKNPU_CORE_AUTO_MASK) { |
---|
413 | 499 | if (rknpu_dev->subcore_datas[0].task_num > |
---|
414 | 500 | rknpu_dev->subcore_datas[1].task_num) { |
---|
415 | 501 | tmp = task_num_list[1]; |
---|
.. | .. |
---|
439 | 525 | |
---|
440 | 526 | job->args->core_mask = rknpu_core_mask(core_index); |
---|
441 | 527 | job->use_core_num = 1; |
---|
442 | | - job->interrupt_count = 1; |
---|
443 | | - job->run_count = 1; |
---|
| 528 | + atomic_set(&job->run_count, job->use_core_num); |
---|
| 529 | + atomic_set(&job->interrupt_count, job->use_core_num); |
---|
444 | 530 | } |
---|
445 | 531 | |
---|
| 532 | + spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
446 | 533 | for (i = 0; i < rknpu_dev->config->num_irqs; i++) { |
---|
447 | 534 | if (job->args->core_mask & rknpu_core_mask(i)) { |
---|
448 | 535 | subcore_data = &rknpu_dev->subcore_datas[i]; |
---|
449 | | - spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
450 | 536 | list_add_tail(&job->head[i], &subcore_data->todo_list); |
---|
451 | | - subcore_data->task_num += rknn_get_task_number(job, i); |
---|
452 | | - job->in_queue[i] = true; |
---|
453 | | - spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
| 537 | + subcore_data->task_num += rknpu_get_task_number(job, i); |
---|
454 | 538 | } |
---|
455 | 539 | } |
---|
| 540 | + spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
456 | 541 | |
---|
457 | 542 | for (i = 0; i < rknpu_dev->config->num_irqs; i++) { |
---|
458 | 543 | if (job->args->core_mask & rknpu_core_mask(i)) |
---|
.. | .. |
---|
464 | 549 | { |
---|
465 | 550 | struct rknpu_device *rknpu_dev = job->rknpu_dev; |
---|
466 | 551 | struct rknpu_subcore_data *subcore_data = NULL; |
---|
467 | | - int core_index = rknpu_core_index(job->args->core_mask); |
---|
468 | | - void __iomem *rknpu_core_base = rknpu_dev->base[core_index]; |
---|
469 | 552 | unsigned long flags; |
---|
470 | 553 | int i = 0; |
---|
471 | 554 | |
---|
472 | 555 | msleep(100); |
---|
473 | 556 | |
---|
| 557 | + spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
474 | 558 | for (i = 0; i < rknpu_dev->config->num_irqs; i++) { |
---|
475 | 559 | if (job->args->core_mask & rknpu_core_mask(i)) { |
---|
476 | 560 | subcore_data = &rknpu_dev->subcore_datas[i]; |
---|
477 | | - spin_lock_irqsave(&rknpu_dev->irq_lock, flags); |
---|
478 | 561 | if (job == subcore_data->job && !job->irq_entry[i]) { |
---|
479 | 562 | subcore_data->job = NULL; |
---|
480 | 563 | subcore_data->task_num -= |
---|
481 | | - rknn_get_task_number(job, i); |
---|
| 564 | + rknpu_get_task_number(job, i); |
---|
482 | 565 | } |
---|
483 | | - spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
484 | 566 | } |
---|
485 | 567 | } |
---|
| 568 | + spin_unlock_irqrestore(&rknpu_dev->irq_lock, flags); |
---|
486 | 569 | |
---|
487 | 570 | if (job->ret == -ETIMEDOUT) { |
---|
488 | | - LOG_ERROR( |
---|
489 | | - "job timeout, flags: %#x, irq status: %#x, raw status: %#x, require mask: %#x, task counter: %#x, elapsed time: %lldus\n", |
---|
490 | | - job->flags, REG_READ(RKNPU_OFFSET_INT_STATUS), |
---|
491 | | - REG_READ(RKNPU_OFFSET_INT_RAW_STATUS), |
---|
492 | | - job->int_mask[core_index], |
---|
493 | | - (REG_READ(RKNPU_OFFSET_PC_TASK_STATUS) & |
---|
494 | | - rknpu_dev->config->pc_task_number_mask), |
---|
495 | | - ktime_to_us(ktime_sub(ktime_get(), job->timestamp))); |
---|
| 571 | + LOG_ERROR("job timeout, flags: %#x:\n", job->flags); |
---|
| 572 | + for (i = 0; i < rknpu_dev->config->num_irqs; i++) { |
---|
| 573 | + if (job->args->core_mask & rknpu_core_mask(i)) { |
---|
| 574 | + void __iomem *rknpu_core_base = |
---|
| 575 | + rknpu_dev->base[i]; |
---|
| 576 | + LOG_ERROR( |
---|
| 577 | + "\tcore %d irq status: %#x, raw status: %#x, require mask: %#x, task counter: %#x, elapsed time: %lldus\n", |
---|
| 578 | + i, REG_READ(RKNPU_OFFSET_INT_STATUS), |
---|
| 579 | + REG_READ(RKNPU_OFFSET_INT_RAW_STATUS), |
---|
| 580 | + job->int_mask[i], |
---|
| 581 | + (REG_READ( |
---|
| 582 | + rknpu_dev->config |
---|
| 583 | + ->pc_task_status_offset) & |
---|
| 584 | + rknpu_dev->config->pc_task_number_mask), |
---|
| 585 | + ktime_us_delta(ktime_get(), |
---|
| 586 | + job->timestamp)); |
---|
| 587 | + } |
---|
| 588 | + } |
---|
496 | 589 | rknpu_soft_reset(rknpu_dev); |
---|
497 | 590 | } else { |
---|
498 | 591 | LOG_ERROR( |
---|
499 | 592 | "job abort, flags: %#x, ret: %d, elapsed time: %lldus\n", |
---|
500 | 593 | job->flags, job->ret, |
---|
501 | | - ktime_to_us(ktime_sub(ktime_get(), job->timestamp))); |
---|
| 594 | + ktime_us_delta(ktime_get(), job->timestamp)); |
---|
502 | 595 | } |
---|
503 | 596 | |
---|
504 | 597 | rknpu_job_cleanup(job); |
---|
.. | .. |
---|
560 | 653 | "invalid irq status: %#x, raw status: %#x, require mask: %#x, task counter: %#x\n", |
---|
561 | 654 | status, REG_READ(RKNPU_OFFSET_INT_RAW_STATUS), |
---|
562 | 655 | job->int_mask[core_index], |
---|
563 | | - (REG_READ(RKNPU_OFFSET_PC_TASK_STATUS) & |
---|
| 656 | + (REG_READ(rknpu_dev->config->pc_task_status_offset) & |
---|
564 | 657 | rknpu_dev->config->pc_task_number_mask)); |
---|
565 | 658 | REG_WRITE(RKNPU_INT_CLEAR, RKNPU_OFFSET_INT_CLEAR); |
---|
566 | 659 | return IRQ_HANDLED; |
---|
.. | .. |
---|
593 | 686 | { |
---|
594 | 687 | struct rknpu_job *job = NULL; |
---|
595 | 688 | unsigned long flags; |
---|
596 | | - ktime_t now = ktime_get(); |
---|
597 | 689 | struct rknpu_subcore_data *subcore_data = NULL; |
---|
598 | 690 | int i = 0; |
---|
599 | 691 | |
---|
.. | .. |
---|
602 | 694 | subcore_data = &rknpu_dev->subcore_datas[i]; |
---|
603 | 695 | job = subcore_data->job; |
---|
604 | 696 | if (job && |
---|
605 | | - ktime_to_ms(ktime_sub(now, job->timestamp)) >= |
---|
| 697 | + ktime_us_delta(ktime_get(), job->timestamp) >= |
---|
606 | 698 | job->args->timeout) { |
---|
607 | 699 | rknpu_soft_reset(rknpu_dev); |
---|
608 | 700 | |
---|
.. | .. |
---|
624 | 716 | struct rknpu_job, |
---|
625 | 717 | head[i]); |
---|
626 | 718 | list_del_init(&job->head[i]); |
---|
627 | | - job->in_queue[i] = false; |
---|
628 | 719 | } else { |
---|
629 | 720 | job = NULL; |
---|
630 | 721 | } |
---|
.. | .. |
---|
779 | 870 | return -EINVAL; |
---|
780 | 871 | |
---|
781 | 872 | *version = REG_READ(RKNPU_OFFSET_VERSION) + |
---|
782 | | - REG_READ(RKNPU_OFFSET_VERSION_NUM); |
---|
| 873 | + (REG_READ(RKNPU_OFFSET_VERSION_NUM) & 0xffff); |
---|
783 | 874 | |
---|
784 | 875 | return 0; |
---|
785 | 876 | } |
---|
.. | .. |
---|
853 | 944 | |
---|
854 | 945 | spin_lock(&rknpu_dev->lock); |
---|
855 | 946 | |
---|
856 | | - REG_WRITE(0x80000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
857 | | - REG_WRITE(0x00000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
| 947 | + if (rknpu_dev->config->pc_dma_ctrl) { |
---|
| 948 | + uint32_t pc_data_addr = REG_READ(RKNPU_OFFSET_PC_DATA_ADDR); |
---|
| 949 | + |
---|
| 950 | + REG_WRITE(0x1, RKNPU_OFFSET_PC_DATA_ADDR); |
---|
| 951 | + REG_WRITE(0x80000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
| 952 | + REG_WRITE(0x00000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
| 953 | + REG_WRITE(pc_data_addr, RKNPU_OFFSET_PC_DATA_ADDR); |
---|
| 954 | + } else { |
---|
| 955 | + REG_WRITE(0x80000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
| 956 | + REG_WRITE(0x00000101, RKNPU_OFFSET_CLR_ALL_RW_AMOUNT); |
---|
| 957 | + } |
---|
858 | 958 | |
---|
859 | 959 | spin_unlock(&rknpu_dev->lock); |
---|
860 | 960 | |
---|