@@ -87,45 +87,74 @@ set(nvrtc_src
87
87
${PROJECT_BINARY_DIR} /include/af/version.h
88
88
89
89
${CMAKE_CURRENT_SOURCE_DIR} /Param.hpp
90
+ ${CMAKE_CURRENT_SOURCE_DIR} /assign_kernel_param.hpp
90
91
${CMAKE_CURRENT_SOURCE_DIR} /backend.hpp
92
+ ${CMAKE_CURRENT_SOURCE_DIR} /dims_param.hpp
91
93
${CMAKE_CURRENT_SOURCE_DIR} /kernel/interp.hpp
92
94
${CMAKE_CURRENT_SOURCE_DIR} /kernel/shared.hpp
93
95
${CMAKE_CURRENT_SOURCE_DIR} /math.hpp
96
+ ${CMAKE_CURRENT_SOURCE_DIR} /minmax_op.hpp
94
97
${CMAKE_CURRENT_SOURCE_DIR} /utility.hpp
95
98
${CMAKE_CURRENT_SOURCE_DIR} /types.hpp
96
99
${CMAKE_CURRENT_SOURCE_DIR} /../common/half.hpp
100
+ ${CMAKE_CURRENT_SOURCE_DIR} /../common/internal_enums.hpp
97
101
${CMAKE_CURRENT_SOURCE_DIR} /../common/kernel_type.hpp
98
102
99
103
${CMAKE_CURRENT_SOURCE_DIR} /kernel/anisotropic_diffusion.cuh
100
104
${CMAKE_CURRENT_SOURCE_DIR} /kernel/approx1.cuh
101
105
${CMAKE_CURRENT_SOURCE_DIR} /kernel/approx2.cuh
106
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/assign.cuh
102
107
${CMAKE_CURRENT_SOURCE_DIR} /kernel/bilateral.cuh
103
108
${CMAKE_CURRENT_SOURCE_DIR} /kernel/canny.cuh
104
109
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve1.cuh
105
110
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve2.cuh
106
111
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve3.cuh
107
112
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve_separable.cuh
113
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/copy.cuh
114
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/diagonal.cuh
115
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/diff.cuh
108
116
${CMAKE_CURRENT_SOURCE_DIR} /kernel/exampleFunction.cuh
117
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/fftconvolve.cuh
109
118
${CMAKE_CURRENT_SOURCE_DIR} /kernel/flood_fill.cuh
119
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/gradient.cuh
110
120
${CMAKE_CURRENT_SOURCE_DIR} /kernel/histogram.cuh
111
121
${CMAKE_CURRENT_SOURCE_DIR} /kernel/hsv_rgb.cuh
122
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/identity.cuh
123
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/iir.cuh
124
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/index.cuh
125
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/iota.cuh
126
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/ireduce.cuh
127
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/join.cuh
128
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/lookup.cuh
129
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/lu_split.cuh
112
130
${CMAKE_CURRENT_SOURCE_DIR} /kernel/match_template.cuh
113
131
${CMAKE_CURRENT_SOURCE_DIR} /kernel/meanshift.cuh
114
132
${CMAKE_CURRENT_SOURCE_DIR} /kernel/medfilt.cuh
133
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/memcopy.cuh
115
134
${CMAKE_CURRENT_SOURCE_DIR} /kernel/moments.cuh
116
135
${CMAKE_CURRENT_SOURCE_DIR} /kernel/morph.cuh
117
136
${CMAKE_CURRENT_SOURCE_DIR} /kernel/pad_array_borders.cuh
137
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/range.cuh
118
138
${CMAKE_CURRENT_SOURCE_DIR} /kernel/resize.cuh
139
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/reorder.cuh
119
140
${CMAKE_CURRENT_SOURCE_DIR} /kernel/rotate.cuh
141
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/select.cuh
120
142
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_dim.cuh
121
143
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_dim_by_key.cuh
122
144
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_first.cuh
123
145
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_first_by_key.cuh
124
146
${CMAKE_CURRENT_SOURCE_DIR} /kernel/sobel.cuh
147
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/sparse.cuh
148
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/sparse_arith.cuh
149
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/susan.cuh
150
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/tile.cuh
125
151
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transform.cuh
126
152
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transpose.cuh
127
153
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transpose_inplace.cuh
154
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/triangle.cuh
155
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/unwrap.cuh
128
156
${CMAKE_CURRENT_SOURCE_DIR} /kernel/where.cuh
157
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/wrap.cuh
129
158
)
130
159
131
160
file_to_string (
@@ -220,13 +249,9 @@ cuda_add_library(afcuda
220
249
anisotropic_diffusion.cpp
221
250
any.cu
222
251
approx.cpp
223
- assign.cu
224
252
bilateral.cpp
225
253
canny.cpp
226
- copy.cu
227
254
count.cu
228
- diagonal.cu
229
- diff.cu
230
255
dilate.cpp
231
256
dilate3d.cpp
232
257
erode.cpp
@@ -235,20 +260,10 @@ cuda_add_library(afcuda
235
260
Event.hpp
236
261
exampleFunction.cpp
237
262
fast.cu
238
- fftconvolve.cu
239
- gradient.cu
240
263
harris.cu
241
264
histogram.cpp
242
265
homography.cu
243
266
hsv_rgb.cpp
244
- identity.cu
245
- iir.cu
246
- index.cu
247
- iota.cu
248
- ireduce.cu
249
- join.cu
250
- lookup.cu
251
- lu.cu
252
267
match_template.cpp
253
268
max.cu
254
269
mean.cu
@@ -260,32 +275,21 @@ cuda_add_library(afcuda
260
275
orb.cu
261
276
pad_array_borders.cpp
262
277
product.cu
263
- qr.cu
264
278
random_engine.cu
265
- range.cu
266
279
regions.cu
267
- reorder.cu
268
280
resize.cpp
269
281
rotate.cpp
270
- select.cu
271
282
set .cu
272
283
sift.cu
273
284
sobel.cpp
274
285
sort .cu
275
286
sort_by_key.cu
276
287
sort_index.cu
277
- sparse.cu
278
- sparse_arith.cu
279
288
sum.cu
280
- susan.cu
281
- tile.cu
282
289
topk.cu
283
290
transform.cpp
284
291
transpose.cpp
285
292
transpose_inplace.cpp
286
- triangle.cu
287
- unwrap.cu
288
- wrap.cu
289
293
290
294
kernel/anisotropic_diffusion.hpp
291
295
kernel/approx.hpp
@@ -373,6 +377,7 @@ cuda_add_library(afcuda
373
377
anisotropic_diffusion.hpp
374
378
approx.hpp
375
379
arith.hpp
380
+ assign.cpp
376
381
assign.hpp
377
382
backend.hpp
378
383
bilateral.hpp
@@ -386,6 +391,7 @@ cuda_add_library(afcuda
386
391
complex.hpp
387
392
convolve.cpp
388
393
convolve.hpp
394
+ copy.cpp
389
395
copy.hpp
390
396
cublas.cpp
391
397
cublas.hpp
@@ -403,7 +409,9 @@ cuda_add_library(afcuda
403
409
device_manager.hpp
404
410
debug_cuda.hpp
405
411
debug_thrust.hpp
412
+ diagonal.cpp
406
413
diagonal.hpp
414
+ diff.cpp
407
415
diff.hpp
408
416
driver.cpp
409
417
err_cuda.hpp
@@ -413,11 +421,13 @@ cuda_add_library(afcuda
413
421
fast_pyramid.hpp
414
422
fft.cpp
415
423
fft.hpp
424
+ fftconvolve.cpp
416
425
fftconvolve.hpp
417
426
flood_fill.cpp
418
427
flood_fill.hpp
419
428
GraphicsResourceManager.cpp
420
429
GraphicsResourceManager.hpp
430
+ gradient.cpp
421
431
gradient.hpp
422
432
handle.cpp
423
433
harris.hpp
@@ -426,19 +436,27 @@ cuda_add_library(afcuda
426
436
histogram.hpp
427
437
homography.hpp
428
438
hsv_rgb.hpp
439
+ identity.cpp
429
440
identity.hpp
441
+ iir.cpp
430
442
iir.hpp
431
443
image.cpp
432
444
image.hpp
445
+ index.cpp
433
446
index.hpp
434
447
inverse.cpp
435
448
inverse.hpp
449
+ iota.cpp
436
450
iota.hpp
451
+ ireduce.cpp
437
452
ireduce.hpp
438
453
jit.cpp
454
+ join.cpp
439
455
join.hpp
440
456
logic.hpp
457
+ lookup.cpp
441
458
lookup.hpp
459
+ lu.cpp
442
460
lu.hpp
443
461
match_template.hpp
444
462
math .hpp
@@ -447,6 +465,7 @@ cuda_add_library(afcuda
447
465
medfilt.hpp
448
466
memory.cpp
449
467
memory.hpp
468
+ minmax_op.hpp
450
469
moments.hpp
451
470
morph.hpp
452
471
morph3d_impl.hpp
@@ -458,12 +477,15 @@ cuda_add_library(afcuda
458
477
plot.cpp
459
478
plot.hpp
460
479
print.hpp
480
+ qr.cpp
461
481
qr.hpp
462
482
random_engine.hpp
483
+ range.cpp
463
484
range.hpp
464
485
reduce.hpp
465
486
reduce_impl.hpp
466
487
regions.hpp
488
+ reorder.cpp
467
489
reorder.hpp
468
490
resize.hpp
469
491
rotate.hpp
@@ -472,6 +494,7 @@ cuda_add_library(afcuda
472
494
scan.hpp
473
495
scan_by_key.cpp
474
496
scan_by_key.hpp
497
+ select.cpp
475
498
select.hpp
476
499
set .hpp
477
500
shift.cpp
@@ -482,30 +505,37 @@ cuda_add_library(afcuda
482
505
solve.hpp
483
506
sort_by_key.hpp
484
507
sort_index.hpp
508
+ sparse.cpp
485
509
sparse.hpp
510
+ sparse_arith.cpp
486
511
sparse_arith.hpp
487
512
sparse_blas.cpp
488
513
sparse_blas.hpp
489
514
surface.cpp
490
515
surface.hpp
516
+ susan.cpp
491
517
susan.hpp
492
518
svd.cpp
493
519
svd.hpp
520
+ tile.cpp
494
521
tile.hpp
495
522
topk.hpp
496
523
traits.hpp
497
524
transform.hpp
498
525
transpose.hpp
526
+ triangle.cpp
499
527
triangle.hpp
500
528
types.hpp
501
529
unary.hpp
530
+ unwrap.cpp
502
531
unwrap.hpp
503
532
utility.cpp
504
533
utility.hpp
505
534
vector_field.cpp
506
535
vector_field.hpp
507
536
where.cpp
508
537
where.hpp
538
+ wrap.cpp
509
539
wrap.hpp
510
540
511
541
jit/BufferNode.hpp
0 commit comments