@@ -89,45 +89,74 @@ set(nvrtc_src
89
89
${PROJECT_BINARY_DIR} /include/af/version.h
90
90
91
91
${CMAKE_CURRENT_SOURCE_DIR} /Param.hpp
92
+ ${CMAKE_CURRENT_SOURCE_DIR} /assign_kernel_param.hpp
92
93
${CMAKE_CURRENT_SOURCE_DIR} /backend.hpp
94
+ ${CMAKE_CURRENT_SOURCE_DIR} /dims_param.hpp
93
95
${CMAKE_CURRENT_SOURCE_DIR} /kernel/interp.hpp
94
96
${CMAKE_CURRENT_SOURCE_DIR} /kernel/shared.hpp
95
97
${CMAKE_CURRENT_SOURCE_DIR} /math.hpp
98
+ ${CMAKE_CURRENT_SOURCE_DIR} /minmax_op.hpp
96
99
${CMAKE_CURRENT_SOURCE_DIR} /utility.hpp
97
100
${CMAKE_CURRENT_SOURCE_DIR} /types.hpp
98
101
${CMAKE_CURRENT_SOURCE_DIR} /../common/half.hpp
102
+ ${CMAKE_CURRENT_SOURCE_DIR} /../common/internal_enums.hpp
99
103
${CMAKE_CURRENT_SOURCE_DIR} /../common/kernel_type.hpp
100
104
101
105
${CMAKE_CURRENT_SOURCE_DIR} /kernel/anisotropic_diffusion.cuh
102
106
${CMAKE_CURRENT_SOURCE_DIR} /kernel/approx1.cuh
103
107
${CMAKE_CURRENT_SOURCE_DIR} /kernel/approx2.cuh
108
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/assign.cuh
104
109
${CMAKE_CURRENT_SOURCE_DIR} /kernel/bilateral.cuh
105
110
${CMAKE_CURRENT_SOURCE_DIR} /kernel/canny.cuh
106
111
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve1.cuh
107
112
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve2.cuh
108
113
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve3.cuh
109
114
${CMAKE_CURRENT_SOURCE_DIR} /kernel/convolve_separable.cuh
115
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/copy.cuh
116
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/diagonal.cuh
117
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/diff.cuh
110
118
${CMAKE_CURRENT_SOURCE_DIR} /kernel/exampleFunction.cuh
119
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/fftconvolve.cuh
111
120
${CMAKE_CURRENT_SOURCE_DIR} /kernel/flood_fill.cuh
121
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/gradient.cuh
112
122
${CMAKE_CURRENT_SOURCE_DIR} /kernel/histogram.cuh
113
123
${CMAKE_CURRENT_SOURCE_DIR} /kernel/hsv_rgb.cuh
124
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/identity.cuh
125
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/iir.cuh
126
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/index.cuh
127
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/iota.cuh
128
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/ireduce.cuh
129
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/join.cuh
130
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/lookup.cuh
131
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/lu_split.cuh
114
132
${CMAKE_CURRENT_SOURCE_DIR} /kernel/match_template.cuh
115
133
${CMAKE_CURRENT_SOURCE_DIR} /kernel/meanshift.cuh
116
134
${CMAKE_CURRENT_SOURCE_DIR} /kernel/medfilt.cuh
135
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/memcopy.cuh
117
136
${CMAKE_CURRENT_SOURCE_DIR} /kernel/moments.cuh
118
137
${CMAKE_CURRENT_SOURCE_DIR} /kernel/morph.cuh
119
138
${CMAKE_CURRENT_SOURCE_DIR} /kernel/pad_array_borders.cuh
139
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/range.cuh
120
140
${CMAKE_CURRENT_SOURCE_DIR} /kernel/resize.cuh
141
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/reorder.cuh
121
142
${CMAKE_CURRENT_SOURCE_DIR} /kernel/rotate.cuh
143
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/select.cuh
122
144
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_dim.cuh
123
145
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_dim_by_key.cuh
124
146
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_first.cuh
125
147
${CMAKE_CURRENT_SOURCE_DIR} /kernel/scan_first_by_key.cuh
126
148
${CMAKE_CURRENT_SOURCE_DIR} /kernel/sobel.cuh
149
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/sparse.cuh
150
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/sparse_arith.cuh
151
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/susan.cuh
152
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/tile.cuh
127
153
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transform.cuh
128
154
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transpose.cuh
129
155
${CMAKE_CURRENT_SOURCE_DIR} /kernel/transpose_inplace.cuh
156
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/triangle.cuh
157
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/unwrap.cuh
130
158
${CMAKE_CURRENT_SOURCE_DIR} /kernel/where.cuh
159
+ ${CMAKE_CURRENT_SOURCE_DIR} /kernel/wrap.cuh
131
160
)
132
161
133
162
file_to_string (
@@ -222,13 +251,9 @@ cuda_add_library(afcuda
222
251
anisotropic_diffusion.cpp
223
252
any.cu
224
253
approx.cpp
225
- assign.cu
226
254
bilateral.cpp
227
255
canny.cpp
228
- copy.cu
229
256
count.cu
230
- diagonal.cu
231
- diff.cu
232
257
dilate.cpp
233
258
dilate3d.cpp
234
259
erode.cpp
@@ -237,20 +262,10 @@ cuda_add_library(afcuda
237
262
Event.hpp
238
263
exampleFunction.cpp
239
264
fast.cu
240
- fftconvolve.cu
241
- gradient.cu
242
265
harris.cu
243
266
histogram.cpp
244
267
homography.cu
245
268
hsv_rgb.cpp
246
- identity.cu
247
- iir.cu
248
- index.cu
249
- iota.cu
250
- ireduce.cu
251
- join.cu
252
- lookup.cu
253
- lu.cu
254
269
match_template.cpp
255
270
max.cu
256
271
mean.cu
@@ -262,32 +277,21 @@ cuda_add_library(afcuda
262
277
orb.cu
263
278
pad_array_borders.cpp
264
279
product.cu
265
- qr.cu
266
280
random_engine.cu
267
- range.cu
268
281
regions.cu
269
- reorder.cu
270
282
resize.cpp
271
283
rotate.cpp
272
- select.cu
273
284
set .cu
274
285
sift.cu
275
286
sobel.cpp
276
287
sort .cu
277
288
sort_by_key.cu
278
289
sort_index.cu
279
- sparse.cu
280
- sparse_arith.cu
281
290
sum.cu
282
- susan.cu
283
- tile.cu
284
291
topk.cu
285
292
transform.cpp
286
293
transpose.cpp
287
294
transpose_inplace.cpp
288
- triangle.cu
289
- unwrap.cu
290
- wrap.cu
291
295
292
296
kernel/anisotropic_diffusion.hpp
293
297
kernel/approx.hpp
@@ -375,6 +379,7 @@ cuda_add_library(afcuda
375
379
anisotropic_diffusion.hpp
376
380
approx.hpp
377
381
arith.hpp
382
+ assign.cpp
378
383
assign.hpp
379
384
backend.hpp
380
385
bilateral.hpp
@@ -388,6 +393,7 @@ cuda_add_library(afcuda
388
393
complex.hpp
389
394
convolve.cpp
390
395
convolve.hpp
396
+ copy.cpp
391
397
copy.hpp
392
398
cublas.cpp
393
399
cublas.hpp
@@ -405,7 +411,9 @@ cuda_add_library(afcuda
405
411
device_manager.hpp
406
412
debug_cuda.hpp
407
413
debug_thrust.hpp
414
+ diagonal.cpp
408
415
diagonal.hpp
416
+ diff.cpp
409
417
diff.hpp
410
418
driver.cpp
411
419
err_cuda.hpp
@@ -415,11 +423,13 @@ cuda_add_library(afcuda
415
423
fast_pyramid.hpp
416
424
fft.cpp
417
425
fft.hpp
426
+ fftconvolve.cpp
418
427
fftconvolve.hpp
419
428
flood_fill.cpp
420
429
flood_fill.hpp
421
430
GraphicsResourceManager.cpp
422
431
GraphicsResourceManager.hpp
432
+ gradient.cpp
423
433
gradient.hpp
424
434
handle.cpp
425
435
harris.hpp
@@ -428,19 +438,27 @@ cuda_add_library(afcuda
428
438
histogram.hpp
429
439
homography.hpp
430
440
hsv_rgb.hpp
441
+ identity.cpp
431
442
identity.hpp
443
+ iir.cpp
432
444
iir.hpp
433
445
image.cpp
434
446
image.hpp
447
+ index.cpp
435
448
index.hpp
436
449
inverse.cpp
437
450
inverse.hpp
451
+ iota.cpp
438
452
iota.hpp
453
+ ireduce.cpp
439
454
ireduce.hpp
440
455
jit.cpp
456
+ join.cpp
441
457
join.hpp
442
458
logic.hpp
459
+ lookup.cpp
443
460
lookup.hpp
461
+ lu.cpp
444
462
lu.hpp
445
463
match_template.hpp
446
464
math .hpp
@@ -449,6 +467,7 @@ cuda_add_library(afcuda
449
467
medfilt.hpp
450
468
memory.cpp
451
469
memory.hpp
470
+ minmax_op.hpp
452
471
moments.hpp
453
472
morph.hpp
454
473
morph3d_impl.hpp
@@ -460,12 +479,15 @@ cuda_add_library(afcuda
460
479
plot.cpp
461
480
plot.hpp
462
481
print.hpp
482
+ qr.cpp
463
483
qr.hpp
464
484
random_engine.hpp
485
+ range.cpp
465
486
range.hpp
466
487
reduce.hpp
467
488
reduce_impl.hpp
468
489
regions.hpp
490
+ reorder.cpp
469
491
reorder.hpp
470
492
resize.hpp
471
493
rotate.hpp
@@ -474,6 +496,7 @@ cuda_add_library(afcuda
474
496
scan.hpp
475
497
scan_by_key.cpp
476
498
scan_by_key.hpp
499
+ select.cpp
477
500
select.hpp
478
501
set .hpp
479
502
shift.cpp
@@ -484,30 +507,37 @@ cuda_add_library(afcuda
484
507
solve.hpp
485
508
sort_by_key.hpp
486
509
sort_index.hpp
510
+ sparse.cpp
487
511
sparse.hpp
512
+ sparse_arith.cpp
488
513
sparse_arith.hpp
489
514
sparse_blas.cpp
490
515
sparse_blas.hpp
491
516
surface.cpp
492
517
surface.hpp
518
+ susan.cpp
493
519
susan.hpp
494
520
svd.cpp
495
521
svd.hpp
522
+ tile.cpp
496
523
tile.hpp
497
524
topk.hpp
498
525
traits.hpp
499
526
transform.hpp
500
527
transpose.hpp
528
+ triangle.cpp
501
529
triangle.hpp
502
530
types.hpp
503
531
unary.hpp
532
+ unwrap.cpp
504
533
unwrap.hpp
505
534
utility.cpp
506
535
utility.hpp
507
536
vector_field.cpp
508
537
vector_field.hpp
509
538
where.cpp
510
539
where.hpp
540
+ wrap.cpp
511
541
wrap.hpp
512
542
513
543
jit/BufferNode.hpp
0 commit comments