..
|
hip
|
quantized
|
rnn
|
CMakeLists.txt
|
abs_op.cc
|
abs_op.cu
|
abs_op.h
|
accumulate_op.cc
|
accumulate_op.cu
|
accumulate_op.h
|
accuracy_op.cc
|
accuracy_op.cu
|
accuracy_op.h
|
acos_op.cc
|
acos_op.cu
|
acos_op.h
|
activation_ops_cudnn.h
|
affine_channel_op.cc
|
affine_channel_op.cu
|
affine_channel_op.h
|
alias_with_name.cc
|
alias_with_name.cu
|
alias_with_name.h
|
apmeter_op.cc
|
apmeter_op.h
|
arg_ops.cc
|
arg_ops.cu
|
arg_ops.h
|
asin_op.cc
|
asin_op.cu
|
asin_op.h
|
assert_op.cc
|
assert_op.cu
|
assert_op.h
|
atan_op.cc
|
atan_op.cu
|
atan_op.h
|
atomic_ops.cc
|
batch_box_cox_op.cc
|
batch_box_cox_op.h
|
batch_bucketize_op.cc
|
batch_bucketize_op.h
|
batch_gather_ops.cc
|
batch_gather_ops.cu
|
batch_gather_ops.h
|
batch_matmul_op.cc
|
batch_matmul_op.cu
|
batch_matmul_op.h
|
batch_matmul_op_gpu_test.cc
|
batch_matmul_op_test.cc
|
batch_moments_op.cc
|
batch_moments_op.cu
|
batch_moments_op.h
|
batch_permutation_op.cc
|
batch_permutation_op.cu
|
batch_permutation_op.h
|
batch_permutation_op_gpu_test.cc
|
batch_sparse_to_dense_op.cc
|
batch_sparse_to_dense_op.cu
|
batch_sparse_to_dense_op.h
|
bbox_transform_op.cc
|
bbox_transform_op.h
|
bisect_percentile_op.cc
|
bisect_percentile_op.h
|
boolean_mask_ops.cc
|
boolean_mask_ops.cu
|
boolean_mask_ops.h
|
boolean_unmask_ops.cc
|
boolean_unmask_ops.cu
|
boolean_unmask_ops.h
|
boolean_unmask_ops_test.cc
|
box_with_nms_limit_op.cc
|
box_with_nms_limit_op.h
|
bucketize_op.cc
|
bucketize_op.cu
|
bucketize_op.h
|
byte_weight_dequant_op.cc
|
byte_weight_dequant_op.h
|
cast_op.cc
|
cast_op.cu
|
cast_op.h
|
cbrt_op.cc
|
cbrt_op.cu
|
cbrt_op.h
|
cc_bmm_bg_op.cc
|
cc_bmm_bg_op.h
|
ceil_op.cc
|
ceil_op.cu
|
ceil_op.h
|
channel_backprop_stats_op.cc
|
channel_backprop_stats_op.cu
|
channel_backprop_stats_op.h
|
channel_shuffle_op.cc
|
channel_shuffle_op.cu
|
channel_shuffle_op.h
|
channel_stats_op.cc
|
channel_stats_op.cu
|
channel_stats_op.h
|
channelwise_conv3d_op_cudnn.cu
|
clip_op.cc
|
clip_op.cu
|
clip_op.h
|
collect_and_distribute_fpn_rpn_proposals_op.cc
|
collect_and_distribute_fpn_rpn_proposals_op.h
|
communicator_op.cc
|
communicator_op_gpu.cc
|
concat_split_op.cc
|
concat_split_op.h
|
concat_split_op_gpu.cc
|
conditional_op.cc
|
conditional_op.h
|
conv_gradient_op.cc
|
conv_op.cc
|
conv_op.h
|
conv_op_cache_cudnn.cc
|
conv_op_cache_cudnn.h
|
conv_op_cache_cudnn_test.cc
|
conv_op_cudnn.cc
|
conv_op_eigen.cc
|
conv_op_gpu.cc
|
conv_op_impl.h
|
conv_op_shared.cc
|
conv_op_shared.h
|
conv_op_shared_gpu.cc
|
conv_pool_op_base.h
|
conv_transpose_gradient_op.cc
|
conv_transpose_op.cc
|
conv_transpose_op.h
|
conv_transpose_op_cudnn.cc
|
conv_transpose_op_gpu.cc
|
conv_transpose_op_impl.h
|
conv_transpose_op_mobile.cc
|
conv_transpose_op_mobile.h
|
conv_transpose_op_mobile_impl.h
|
conv_transpose_op_mobile_test.cc
|
conv_transpose_unpool_op_base.h
|
copy_op.cc
|
copy_op.cu
|
copy_op.h
|
copy_rows_to_tensor_op.cc
|
copy_rows_to_tensor_op.h
|
cos_op.cc
|
cos_op.cu
|
cos_op.h
|
cosh_op.cc
|
cosh_op.cu
|
cosh_op.h
|
cosine_embedding_criterion_op.cc
|
cosine_embedding_criterion_op.cu
|
cosine_embedding_criterion_op.h
|
counter_ops.cc
|
counter_ops.h
|
counter_ops_gpu.cc
|
crash_op.cc
|
create_scope_op.cc
|
create_scope_op.h
|
crf_viterbi_op.cc
|
cross_entropy_op.cc
|
cross_entropy_op.cu
|
cross_entropy_op.h
|
ctc_beam_search_decoder_op.cc
|
ctc_beam_search_decoder_op.h
|
ctc_greedy_decoder_op.cc
|
ctc_greedy_decoder_op.h
|
cube_op.cc
|
cube_op.cu
|
cube_op.h
|
data_couple.cc
|
data_couple.h
|
data_couple_gpu.cu
|
dataset_ops.cc
|
dataset_ops.h
|
deform_conv_gradient_op.cc
|
deform_conv_op.cc
|
deform_conv_op.cu
|
deform_conv_op.h
|
deform_conv_op_impl.h
|
dense_vector_to_id_list_op.cc
|
dense_vector_to_id_list_op.h
|
depthwise_3x3_conv_op_cudnn.cu
|
distance_op.cc
|
distance_op.cu
|
distance_op.h
|
do_op.cc
|
do_op.h
|
do_op_gpu.cc
|
dropout_op.cc
|
dropout_op.cu
|
dropout_op.h
|
dropout_op_cudnn.cc
|
elementwise_add_gradient_op.cc
|
elementwise_add_op.cc
|
elementwise_add_op.h
|
elementwise_add_op_gpu.cc
|
elementwise_div_gradient_op.cc
|
elementwise_div_op.cc
|
elementwise_div_op.cu
|
elementwise_div_op.h
|
elementwise_linear_op.cc
|
elementwise_linear_op.cu
|
elementwise_linear_op.h
|
elementwise_logical_ops.cc
|
elementwise_logical_ops.h
|
elementwise_mul_gradient_op.cc
|
elementwise_mul_op.cc
|
elementwise_mul_op.cu
|
elementwise_mul_op.h
|
elementwise_op_gpu_test.cc
|
elementwise_op_test.cc
|
elementwise_op_test.h
|
elementwise_ops.cc
|
elementwise_ops.cu
|
elementwise_ops.h
|
elementwise_ops_schema.cc
|
elementwise_ops_utils.cc
|
elementwise_ops_utils.h
|
elementwise_sub_gradient_op.cc
|
elementwise_sub_op.cc
|
elementwise_sub_op.h
|
elementwise_sub_op_gpu.cc
|
elementwise_sum_op.cc
|
elu_op.cc
|
elu_op.cu
|
elu_op.h
|
elu_op_cudnn.cc
|
enforce_finite_op.cc
|
enforce_finite_op.cu
|
enforce_finite_op.h
|
ensure_clipped_op.cc
|
ensure_clipped_op.h
|
ensure_cpu_output_op.cc
|
ensure_cpu_output_op.cu
|
ensure_cpu_output_op.h
|
erf_op.cc
|
erf_op.cu
|
erf_op.h
|
exp_op.cc
|
exp_op.h
|
exp_op_gpu.cc
|
expand_op.cc
|
expand_op.h
|
expand_op_gpu.cc
|
expand_squeeze_dims_op.cc
|
expand_squeeze_dims_op.h
|
expand_squeeze_dims_op_gpu.cc
|
fc_inference.cc
|
fc_inference.h
|
feature_maps_ops.cc
|
feature_maps_ops.h
|
feed_blob_op.cc
|
feed_blob_op.h
|
filler_op.cc
|
filler_op.cu
|
filler_op.h
|
find_duplicate_elements_op.cc
|
find_duplicate_elements_op.h
|
find_op.cc
|
find_op.cu
|
find_op.h
|
flatten_op.cc
|
flatten_op.h
|
flexible_top_k.cc
|
flexible_top_k.h
|
floor_op.cc
|
floor_op.cu
|
floor_op.h
|
free_op.cc
|
free_op.h
|
free_op_gpu.cc
|
fully_connected_op.cc
|
fully_connected_op.h
|
fully_connected_op_gpu.cc
|
fused_rowwise_8bit_conversion_ops.cc
|
fused_rowwise_8bit_conversion_ops.h
|
fused_rowwise_nbit_conversion_ops.cc
|
fused_rowwise_nbit_conversion_ops.h
|
fused_rowwise_nbitfake_conversion_ops.cc
|
fused_rowwise_nbitfake_conversion_ops.h
|
fused_rowwise_random_quantization_ops.cc
|
fused_rowwise_random_quantization_ops.h
|
gather_fused_8bit_rowwise_op.cc
|
gather_fused_8bit_rowwise_op.h
|
gather_op.cc
|
gather_op.cu
|
gather_op.cuh
|
gather_op.h
|
gather_ranges_to_dense_op.cc
|
gather_ranges_to_dense_op.h
|
gelu_op.cc
|
gelu_op.cu
|
gelu_op.h
|
generate_proposals_op.cc
|
generate_proposals_op.cu
|
generate_proposals_op.h
|
generate_proposals_op_gpu_test.cc
|
generate_proposals_op_test.cc
|
generate_proposals_op_util_boxes.h
|
generate_proposals_op_util_boxes_test.cc
|
generate_proposals_op_util_nms.h
|
generate_proposals_op_util_nms_gpu.cu
|
generate_proposals_op_util_nms_gpu.h
|
generate_proposals_op_util_nms_gpu_test.cc
|
generate_proposals_op_util_nms_test.cc
|
given_tensor_byte_string_to_uint8_fill_op.cc
|
given_tensor_byte_string_to_uint8_fill_op.cu
|
given_tensor_byte_string_to_uint8_fill_op.h
|
given_tensor_fill_op.cc
|
given_tensor_fill_op.cu
|
given_tensor_fill_op.h
|
glu_op.cc
|
glu_op.cu
|
glu_op.h
|
group_norm_op.cc
|
group_norm_op.cu
|
group_norm_op.h
|
gru_unit_op.cc
|
gru_unit_op.h
|
gru_unit_op_gpu.cu
|
h_softmax_op.cc
|
h_softmax_op.h
|
half_float_ops.cc
|
half_float_ops.cu
|
half_float_ops.h
|
half_float_ops_test.cc
|
hard_sigmoid_op.cc
|
hard_sigmoid_op.cu
|
hard_sigmoid_op.h
|
heatmap_max_keypoint_op.cc
|
heatmap_max_keypoint_op.h
|
histogram_op.cc
|
histogram_op.h
|
if_op.cc
|
if_op.h
|
if_op_gpu.cc
|
im2col_op.cc
|
im2col_op.h
|
im2col_op_gpu.cc
|
index_hash_ops.cc
|
index_hash_ops.h
|
index_ops.cc
|
index_ops.h
|
inference_lstm_op.cc
|
inference_lstm_op.h
|
instance_norm_gradient_op.cc
|
instance_norm_op.cc
|
instance_norm_op.cu
|
instance_norm_op.h
|
integral_image_op.cc
|
integral_image_op.cu
|
integral_image_op.h
|
is_empty_op.cc
|
is_empty_op.h
|
jsd_op.cc
|
jsd_op.h
|
key_split_ops.cc
|
key_split_ops.h
|
last_n_window_collector.cc
|
layer_norm_op.cc
|
layer_norm_op.cu
|
layer_norm_op.h
|
leaky_relu_op.cc
|
leaky_relu_op.cu
|
leaky_relu_op.h
|
length_split_op.cc
|
length_split_op.h
|
lengths_pad_op.cc
|
lengths_pad_op.cu
|
lengths_pad_op.h
|
lengths_reducer_fused_8bit_rowwise_ops.cc
|
lengths_reducer_fused_8bit_rowwise_ops.h
|
lengths_reducer_fused_nbit_rowwise_ops.cc
|
lengths_reducer_fused_nbit_rowwise_ops.h
|
lengths_reducer_ops.cc
|
lengths_reducer_ops.h
|
lengths_reducer_rowwise_8bit_ops.cc
|
lengths_reducer_rowwise_8bit_ops.h
|
lengths_tile_op.cc
|
lengths_tile_op.cu
|
lengths_tile_op.h
|
lengths_top_k_op.cc
|
lengths_top_k_op.h
|
listwise_l2r_op.cc
|
listwise_l2r_op.h
|
load_save_op.cc
|
load_save_op.h
|
load_save_op_gpu.cc
|
load_save_op_util.cc
|
load_save_op_util.h
|
local_response_normalization_op.cc
|
local_response_normalization_op.cu
|
local_response_normalization_op.h
|
local_response_normalization_op_cudnn.cc
|
locally_connected_op.cc
|
locally_connected_op.h
|
locally_connected_op_gpu.cc
|
locally_connected_op_impl.h
|
locally_connected_op_util.cc
|
locally_connected_op_util.h
|
log_op.cc
|
log_op.h
|
log_op_gpu.cc
|
logit_op.cc
|
logit_op.cu
|
logit_op.h
|
loss_op.cc
|
loss_op.cu
|
loss_op.h
|
lp_pool_op.cc
|
lp_pool_op.cu
|
lpnorm_op.cc
|
lpnorm_op.cu
|
lpnorm_op.h
|
lstm_unit_op.cc
|
lstm_unit_op.h
|
lstm_unit_op_gpu.cu
|
lstm_utils.h
|
map_ops.cc
|
map_ops.h
|
margin_ranking_criterion_op.cc
|
margin_ranking_criterion_op.cu
|
margin_ranking_criterion_op.h
|
matmul_op.cc
|
matmul_op.h
|
matmul_op_gpu.cc
|
max_pool_with_index.cu
|
max_pool_with_index_gpu.h
|
mean_op.cc
|
mean_op.cu
|
mean_op.h
|
mem_query_op.cu
|
merge_id_lists_op.cc
|
merge_id_lists_op.h
|
minmax_gradient_ops.cc
|
minmax_ops.cc
|
minmax_ops.cu
|
minmax_ops.h
|
mish_op.cc
|
mish_op.h
|
mod_op.cc
|
mod_op.h
|
moments_op.cc
|
moments_op.cu
|
moments_op.h
|
multi_class_accuracy_op.cc
|
multi_class_accuracy_op.cu
|
multi_class_accuracy_op.h
|
negate_gradient_op.cc
|
negate_gradient_op.h
|
negate_gradient_op_gpu.cc
|
negative_op.cc
|
negative_op.h
|
negative_op_gpu.cc
|
ngram_ops.cc
|
ngram_ops.h
|
no_default_engine_op.h
|
norm_planar_yuv_op.cc
|
normalize_l1_op.cc
|
normalize_l1_op.h
|
normalize_op.cc
|
normalize_op.h
|
normalize_ops.cu
|
numpy_tile_op.cc
|
numpy_tile_op.h
|
one_hot_ops.cc
|
one_hot_ops.cu
|
one_hot_ops.h
|
onnx_while_op.cc
|
onnx_while_op.h
|
op_utils_cudnn.h
|
operator_fallback_gpu.h
|
operator_fallback_gpu_test.cc
|
order_switch_ops.cc
|
order_switch_ops.h
|
order_switch_ops_cudnn.cc
|
order_switch_ops_gpu.cc
|
pack_rnn_sequence_op.cc
|
pack_rnn_sequence_op.h
|
pack_segments.cc
|
pack_segments.cu
|
pack_segments.h
|
pad_op.cc
|
pad_op.h
|
pad_op_gpu.cu
|
partition_ops.cc
|
partition_ops.h
|
percentile_op.cc
|
percentile_op.h
|
perplexity_op.cc
|
perplexity_op.cu
|
perplexity_op.h
|
piecewise_linear_transform_op.cc
|
piecewise_linear_transform_op.cu
|
piecewise_linear_transform_op.h
|
pool_gradient_op.cc
|
pool_op.cc
|
pool_op.cu
|
pool_op.h
|
pool_op_cudnn.cc
|
pool_op_util.cc
|
pool_op_util.h
|
pow_op.cc
|
pow_op.cu
|
pow_op.h
|
prefetch_op.h
|
prelu_op.cc
|
prelu_op.cu
|
prelu_op.h
|
prepend_dim_op.cc
|
prepend_dim_op.h
|
prepend_dim_op_gpu.cc
|
quant_decode_op.cc
|
quant_decode_op.h
|
quantile_op.cc
|
quantile_op.h
|
rank_loss_op.cc
|
rank_loss_op.h
|
reciprocal_gradient_op.cc
|
reciprocal_op.cc
|
reciprocal_op.cu
|
reciprocal_op.h
|
reduce_front_back_max_ops.cc
|
reduce_front_back_max_ops.cu
|
reduce_front_back_max_ops.h
|
reduce_front_back_mean_ops.cc
|
reduce_front_back_sum_mean_ops.cu
|
reduce_front_back_sum_mean_ops.h
|
reduce_front_back_sum_ops.cc
|
reduce_ops.cc
|
reduce_ops.cu
|
reduce_ops.h
|
reducer_functors.h
|
reduction_ops.cc
|
reduction_ops.cu
|
reduction_ops.h
|
relu_n_op.cc
|
relu_n_op.cu
|
relu_n_op.h
|
relu_op.cc
|
relu_op.cu
|
relu_op.h
|
remove_data_blocks_op.cc
|
remove_data_blocks_op.h
|
replace_nan_op.cc
|
replace_nan_op.cu
|
replace_nan_op.h
|
reservoir_sampling.cc
|
reshape_op.cc
|
reshape_op.h
|
reshape_op_gpu.cc
|
reshape_op_gpu_test.cc
|
resize_3d_op.cc
|
resize_3d_op.cu
|
resize_3d_op.h
|
resize_op.cc
|
resize_op.cu
|
resize_op.h
|
reverse_packed_segs_op.cc
|
reverse_packed_segs_op.cu
|
reverse_packed_segs_op.h
|
rmac_regions_op.cc
|
rmac_regions_op.cu
|
rmac_regions_op.h
|
rms_norm_op.cc
|
rms_norm_op.cu
|
rms_norm_op.h
|
roi_align_gradient_op.cc
|
roi_align_gradient_op.cu
|
roi_align_gradient_op.h
|
roi_align_op.cc
|
roi_align_op.cu
|
roi_align_op.h
|
roi_align_op_gpu_test.cc
|
roi_align_rotated_gradient_op.cc
|
roi_align_rotated_gradient_op.cu
|
roi_align_rotated_gradient_op.h
|
roi_align_rotated_op.cc
|
roi_align_rotated_op.cu
|
roi_align_rotated_op.h
|
roi_pool_op.cc
|
roi_pool_op.cu
|
roi_pool_op.h
|
rowmul_op.cc
|
rowmul_op.h
|
rsqrt_op.cc
|
rsqrt_op.cu
|
rsqrt_op.h
|
scale_blobs_op.cc
|
scale_blobs_op.cu
|
scale_blobs_op.h
|
scale_op.cc
|
scale_op.h
|
scale_op_gpu.cc
|
segment_reduction_op.cc
|
segment_reduction_op.h
|
segment_reduction_op_gpu.cu
|
segment_reduction_op_gpu.cuh
|
self_binning_histogram_op.cc
|
self_binning_histogram_op.h
|
selu_op.cc
|
selu_op.cu
|
selu_op.h
|
sequence_ops.cc
|
sequence_ops.cu
|
sequence_ops.h
|
shape_op.cc
|
shape_op.h
|
shape_op_gpu.cc
|
sigmoid_gradient_op.cc
|
sigmoid_op.cc
|
sigmoid_op.cu
|
sigmoid_op.h
|
sigmoid_op_cudnn.cc
|
sin_op.cc
|
sin_op.cu
|
sin_op.h
|
sinh_op.cc
|
sinh_op.cu
|
sinh_op.h
|
sinusoid_position_encoding_op.cc
|
sinusoid_position_encoding_op.h
|
slice_op.cc
|
slice_op.cu
|
slice_op.h
|
softmax_op.cc
|
softmax_op.h
|
softmax_op_cudnn.cc
|
softmax_ops.cu
|
softmax_utils.cc
|
softmax_utils.h
|
softmax_with_loss_op.cc
|
softmax_with_loss_op.h
|
softplus_op.cc
|
softplus_op.cu
|
softplus_op.h
|
softsign_op.cc
|
softsign_op.cu
|
softsign_op.h
|
space_batch_op.cc
|
space_batch_op.h
|
space_batch_op_gpu.cu
|
sparse_dropout_with_replacement_op.cc
|
sparse_dropout_with_replacement_op.h
|
sparse_lp_regularizer_op.cc
|
sparse_lp_regularizer_op.h
|
sparse_lp_regularizer_op_gpu.cu
|
sparse_normalize_op.cc
|
sparse_normalize_op.h
|
sparse_normalize_op_gpu.cu
|
sparse_to_dense_mask_op.cc
|
sparse_to_dense_mask_op.h
|
sparse_to_dense_op.cc
|
sparse_to_dense_op.cu
|
sparse_to_dense_op.h
|
spatial_batch_norm_gradient_op.cc
|
spatial_batch_norm_op.cc
|
spatial_batch_norm_op.cu
|
spatial_batch_norm_op.h
|
spatial_batch_norm_op_cudnn.cu
|
spatial_batch_norm_op_impl.cuh
|
spatial_softmax_with_loss_op.cc
|
spatial_softmax_with_loss_op.h
|
sqr_op.cc
|
sqr_op.h
|
sqr_op_gpu.cc
|
sqrt_op.cc
|
sqrt_op.h
|
sqrt_op_gpu.cc
|
square_root_divide_op.cc
|
square_root_divide_op.h
|
stats_ops.cc
|
stats_put_ops.cc
|
stats_put_ops.h
|
stop_gradient.cc
|
stop_gradient.h
|
stop_gradient_gpu.cc
|
string_ops.cc
|
string_ops.h
|
string_ops_test.cc
|
stump_func_op.cc
|
stump_func_op.cu
|
stump_func_op.h
|
stylizer_ops.cc
|
summarize_op.cc
|
summarize_op.cu
|
summarize_op.h
|
swish_op.cc
|
swish_op.cu
|
swish_op.h
|
tan_op.cc
|
tan_op.cu
|
tan_op.h
|
tanh_gradient_op.cc
|
tanh_op.cc
|
tanh_op.cu
|
tanh_op.h
|
tanh_op_cudnn.cc
|
tensor_protos_db_input.cc
|
tensor_protos_db_input.h
|
tensor_protos_db_input_gpu.cc
|
text_file_reader.cc
|
text_file_reader_utils.cc
|
text_file_reader_utils.h
|
text_file_reader_utils_test.cc
|
thresholded_relu_op.cc
|
thresholded_relu_op.cu
|
thresholded_relu_op.h
|
tile_op.cc
|
tile_op.cu
|
tile_op.h
|
top_k.cc
|
top_k.cu
|
top_k.h
|
top_k_heap_selection.cuh
|
top_k_radix_selection.cuh
|
transpose_op.cc
|
transpose_op.cu
|
transpose_op.h
|
transpose_op_cudnn.cc
|
tt_linear_op.cc
|
tt_linear_op.h
|
unique_ops.cc
|
unique_ops.cu
|
unique_ops.h
|
upsample_op.cc
|
upsample_op.cu
|
upsample_op.h
|
utility_ops.cc
|
utility_ops.cu
|
utility_ops.h
|
utility_ops_gpu_test.cc
|
utility_ops_test.cc
|
variable_length_sequence_padding.cc
|
variable_length_sequence_padding.h
|
weighted_multi_sampling_op.cc
|
weighted_multi_sampling_op.h
|
weighted_sample_op.cc
|
weighted_sample_op.cu
|
weighted_sample_op.h
|
while_op.cc
|
while_op.h
|
while_op_gpu.cc
|
workspace_ops.cc
|
zero_gradient_op.cc
|
zero_gradient_op.h
|
zero_gradient_op_gpu.cc
|