Index of /rfdiffusion2/cutlass-3.5.1/test/unit/gemm/device/


../
CMakeLists.txt                                     20-Aug-2024 02:21               26389
default_gemm_configuration.hpp                     20-Aug-2024 02:21               53507
gemm_b1t_b1n_s32n_tensor_op_s32_sm75.cu            20-Aug-2024 02:21               10188
gemm_b1t_b1n_s32n_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               33161
gemm_b1t_b1n_s32n_wmma_tensor_op_s32_sm75.cu       20-Aug-2024 02:21                8933
gemm_b1t_b1n_s32t_tensor_op_s32_sm75.cu            20-Aug-2024 02:21               10162
gemm_b1t_b1n_s32t_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               17912
gemm_b1t_b1n_s32t_wmma_tensor_op_s32_sm75.cu       20-Aug-2024 02:21                8914
gemm_bf16n_bf16n_f32t_tensor_op_f32_sm80.cu        20-Aug-2024 02:21               16447
gemm_bf16t_bf16t_bf16t_tensor_op_f32_sm80.cu       20-Aug-2024 02:21               16575
gemm_cf32n_cf32t_cf32t_tensor_op_tf32_f32_sm80.cu  20-Aug-2024 02:21                8316
gemm_cf32t_cf32n_cf32t_tensor_op_tf32_f32_sm80.cu  20-Aug-2024 02:21                8314
gemm_cf64n_cf64t_cf64t_tensor_op_f64_gaussian_s..> 20-Aug-2024 02:21                6714
gemm_cf64n_cf64t_cf64t_tensor_op_f64_gaussian_s..> 20-Aug-2024 02:21                6746
gemm_cf64n_cf64t_cf64t_tensor_op_f64_sm80.cu       20-Aug-2024 02:21                7895
gemm_cf64n_cf64t_cf64t_tensor_op_f64_sm90.cu       20-Aug-2024 02:21                7929
gemm_cf64t_cf64n_cf64t_tensor_op_f64_gaussian_s..> 20-Aug-2024 02:21                6516
gemm_cf64t_cf64n_cf64t_tensor_op_f64_gaussian_s..> 20-Aug-2024 02:21                6548
gemm_cf64t_cf64n_cf64t_tensor_op_f64_sm80.cu       20-Aug-2024 02:21                9016
gemm_cf64t_cf64n_cf64t_tensor_op_f64_sm90.cu       20-Aug-2024 02:21                9051
gemm_f16n_f16n_f16n_direct_store_tensor_op_f32_..> 20-Aug-2024 02:21                4556
gemm_f16n_f16n_f16n_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21                6165
gemm_f16n_f16n_f16n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6124
gemm_f16n_f16n_f16t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                9634
gemm_f16n_f16n_f16t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16357
gemm_f16n_f16n_f16t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               13307
gemm_f16n_f16n_f16t_volta_tensor_op_f32_sm70.cu    20-Aug-2024 02:21                8845
gemm_f16n_f16n_f16t_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21               13583
gemm_f16n_f16n_f16t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               13464
gemm_f16n_f16n_f32n_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                9571
gemm_f16n_f16n_f32n_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16239
gemm_f16n_f16n_f32n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6140
gemm_f16n_f16n_f32t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                9544
gemm_f16n_f16n_f32t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16417
gemm_f16n_f16n_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               13193
gemm_f16n_f16n_f32t_volta_tensor_op_f32_sm70.cu    20-Aug-2024 02:21                8775
gemm_f16n_f16n_f32t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               11470
gemm_f16n_f16t_f16n_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21                6156
gemm_f16n_f16t_f16n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6116
gemm_f16n_f16t_f16t_tensor_op_f16_slicedk_sm75.cu  20-Aug-2024 02:21                3528
gemm_f16n_f16t_f16t_tensor_op_f16_slicedk_sm80.cu  20-Aug-2024 02:21                3539
gemm_f16n_f16t_f16t_tensor_op_f16_sm75.cu          20-Aug-2024 02:21               15092
gemm_f16n_f16t_f16t_tensor_op_f16_sm80.cu          20-Aug-2024 02:21               16470
gemm_f16n_f16t_f16t_tensor_op_f16_sparse_sm80.cu   20-Aug-2024 02:21               13392
gemm_f16n_f16t_f16t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               13900
gemm_f16n_f16t_f16t_volta_tensor_op_f16_sm70.cu    20-Aug-2024 02:21                8608
gemm_f16n_f16t_f16t_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21               13518
gemm_f16n_f16t_f16t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                3645
gemm_f16n_f16t_f32n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6096
gemm_f16n_f16t_f32t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                7845
gemm_f16n_f16t_f32t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               18135
gemm_f16n_f16t_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               20134
gemm_f16n_f16t_f32t_volta_tensor_op_f32_sm70.cu    20-Aug-2024 02:21                8505
gemm_f16n_f16t_f32t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               11497
gemm_f16t_f16n_f16n_singlestage_wmma_tensor_op_..> 20-Aug-2024 02:21               11090
gemm_f16t_f16n_f16n_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21                6156
gemm_f16t_f16n_f16n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6116
gemm_f16t_f16n_f16t_singlestage_wmma_tensor_op_..> 20-Aug-2024 02:21               11066
gemm_f16t_f16n_f16t_tensor_op_f16_broadcast_sm8..> 20-Aug-2024 02:21               17080
gemm_f16t_f16n_f16t_tensor_op_f16_slicedk_sm75.cu  20-Aug-2024 02:21                3528
gemm_f16t_f16n_f16t_tensor_op_f16_slicedk_sm80.cu  20-Aug-2024 02:21                3540
gemm_f16t_f16n_f16t_tensor_op_f16_sm75.cu          20-Aug-2024 02:21                7964
gemm_f16t_f16n_f16t_tensor_op_f16_sm80.cu          20-Aug-2024 02:21               16457
gemm_f16t_f16n_f16t_tensor_op_f16_sparse_sm80.cu   20-Aug-2024 02:21               13384
gemm_f16t_f16n_f16t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21               12317
gemm_f16t_f16n_f16t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               27384
gemm_f16t_f16n_f16t_volta_tensor_op_f16_sm70.cu    20-Aug-2024 02:21                8933
gemm_f16t_f16n_f16t_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21               13551
gemm_f16t_f16n_f16t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               13540
gemm_f16t_f16n_f32n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6130
gemm_f16t_f16n_f32t_singlestage_wmma_tensor_op_..> 20-Aug-2024 02:21                8160
gemm_f16t_f16n_f32t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                7847
gemm_f16t_f16n_f32t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16131
gemm_f16t_f16n_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               19262
gemm_f16t_f16n_f32t_volta_tensor_op_f32_sm70.cu    20-Aug-2024 02:21                8754
gemm_f16t_f16n_f32t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               11497
gemm_f16t_f16t_f16n_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21                6147
gemm_f16t_f16t_f16n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6107
gemm_f16t_f16t_f16t_wmma_tensor_op_f16_sm70.cu     20-Aug-2024 02:21               13518
gemm_f16t_f16t_f16t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               13398
gemm_f16t_f16t_f32n_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                7845
gemm_f16t_f16t_f32n_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16149
gemm_f16t_f16t_f32n_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21                6119
gemm_f16t_f16t_f32t_tensor_op_f32_sm75.cu          20-Aug-2024 02:21                7827
gemm_f16t_f16t_f32t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21               16101
gemm_f16t_f16t_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21                9608
gemm_f16t_f16t_f32t_volta_tensor_op_f32_sm70.cu    20-Aug-2024 02:21                7898
gemm_f16t_f16t_f32t_wmma_tensor_op_f32_sm70.cu     20-Aug-2024 02:21               11470
gemm_f32n_f32n_f32t_tensor_op_bf16_f32_sm80.cu     20-Aug-2024 02:21                3584
gemm_f32n_f32n_f32t_tensor_op_f32_sm80.cu          20-Aug-2024 02:21                3473
gemm_f32n_f32n_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               13085
gemm_f32n_f32t_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               13914
gemm_f32t_f32n_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               19104
gemm_f32t_f32t_f32t_tensor_op_f32_sparse_sm80.cu   20-Aug-2024 02:21               13013
gemm_f64n_f64t_f64t_tensor_op_f64_sm80.cu          20-Aug-2024 02:21                8349
gemm_f64n_f64t_f64t_tensor_op_f64_sm90.cu          20-Aug-2024 02:21                7299
gemm_f64t_f64n_f64t_tensor_op_f64_sm80.cu          20-Aug-2024 02:21                8348
gemm_f64t_f64n_f64t_tensor_op_f64_sm90.cu          20-Aug-2024 02:21                7290
gemm_f8t_f8n_f32t_tensor_op_f32_sm89.cu            20-Aug-2024 02:21                7093
gemm_f8t_f8n_f32t_tensor_op_f32_sparse_sm89.cu     20-Aug-2024 02:21                7252
gemm_f8t_f8n_f8t_tensor_op_f32_sm89.cu             20-Aug-2024 02:21               18766
gemm_f8t_f8n_f8t_tensor_op_f32_sparse_sm89.cu      20-Aug-2024 02:21               20564
gemm_grouped_scheduler_sm80.cu                     20-Aug-2024 02:21               10240
gemm_grouped_sm80.cu                               20-Aug-2024 02:21               26102
gemm_planar_complex_f16_f16_f32_tensor_op_sm70.cu  20-Aug-2024 02:21               11339
gemm_planar_complex_f16_f16_f32_tensor_op_sm75.cu  20-Aug-2024 02:21                7346
gemm_planar_complex_f16_f16_f32_tensor_op_sm80.cu  20-Aug-2024 02:21               12397
gemm_s4n_s4t_s4n_tensor_op_s32_sm75.cu             20-Aug-2024 02:21                6857
gemm_s4n_s4t_s4n_tensor_op_s32_sm80.cu             20-Aug-2024 02:21                7239
gemm_s4t_s4n_s32n_tensor_op_s32_sm75.cu            20-Aug-2024 02:21                8119
gemm_s4t_s4n_s32n_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               16882
gemm_s4t_s4n_s32n_wmma_tensor_op_s32_sm75.cu       20-Aug-2024 02:21                8405
gemm_s4t_s4n_s32t_tensor_op_s32_sm75.cu            20-Aug-2024 02:21                8101
gemm_s4t_s4n_s32t_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               17111
gemm_s4t_s4n_s32t_tensor_op_s32_sparse_sm80.cu     20-Aug-2024 02:21               21925
gemm_s4t_s4n_s32t_wmma_tensor_op_s32_sm75.cu       20-Aug-2024 02:21                8387
gemm_s4t_s4n_s4n_tensor_op_s32_sm75.cu             20-Aug-2024 02:21               10938
gemm_s4t_s4n_s4n_tensor_op_s32_sm80.cu             20-Aug-2024 02:21               18441
gemm_s4t_s4n_s4t_tensor_op_s32_sm75.cu             20-Aug-2024 02:21               17410
gemm_s4t_s4n_s4t_tensor_op_s32_sm80.cu             20-Aug-2024 02:21               33782
gemm_s8n_s8t_s8n_tensor_op_s32_sm75.cu             20-Aug-2024 02:21                9586
gemm_s8n_s8t_s8n_tensor_op_s32_sm80.cu             20-Aug-2024 02:21               11288
gemm_s8t_s8n_f16t_tensor_op_s32_sm80.cu            20-Aug-2024 02:21                3514
gemm_s8t_s8n_s32n_tensor_op_s32_sm75.cu            20-Aug-2024 02:21                7975
gemm_s8t_s8n_s32n_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               16531
gemm_s8t_s8n_s32n_wmma_tensor_op_s32_sm72.cu       20-Aug-2024 02:21                5693
gemm_s8t_s8n_s32t_tensor_op_s32_sm75.cu            20-Aug-2024 02:21                7957
gemm_s8t_s8n_s32t_tensor_op_s32_sm80.cu            20-Aug-2024 02:21               16691
gemm_s8t_s8n_s32t_tensor_op_s32_sparse_sm80.cu     20-Aug-2024 02:21               21485
gemm_s8t_s8n_s32t_wmma_tensor_op_s32_sm72.cu       20-Aug-2024 02:21                6864
gemm_s8t_s8n_s8n_tensor_op_s32_sm75.cu             20-Aug-2024 02:21                8538
gemm_s8t_s8n_s8n_tensor_op_s32_sm80.cu             20-Aug-2024 02:21               18204
gemm_s8t_s8n_s8n_wmma_tensor_op_s32_sm72.cu        20-Aug-2024 02:21                6675
gemm_s8t_s8n_s8t_tensor_op_s32_sm75.cu             20-Aug-2024 02:21               18325
gemm_s8t_s8n_s8t_tensor_op_s32_sm80.cu             20-Aug-2024 02:21               43279
gemm_s8t_s8n_s8t_wmma_tensor_op_s32_sm72.cu        20-Aug-2024 02:21                6663
gemm_splitk_serial_tensor_op_sm75.cu               20-Aug-2024 02:21                4663
gemm_splitk_simt_sm50.cu                           20-Aug-2024 02:21                4945
gemm_splitk_tensor_op_sm70.cu                      20-Aug-2024 02:21                6616
gemm_splitk_tensor_op_sm75.cu                      20-Aug-2024 02:21               10581
gemm_testbed_3x.hpp                                20-Aug-2024 02:21               68444
gemm_testbed_3x_evt.hpp                            20-Aug-2024 02:21               47284
gemm_testbed_3x_ptr_array.hpp                      20-Aug-2024 02:21               68895
gemm_testbed_3x_tensor_broadcast.hpp               20-Aug-2024 02:21               20070
gemm_tf32n_tf32n_f32t_tensor_op_f32_sm80.cu        20-Aug-2024 02:21               16950
gemm_tf32n_tf32t_f32t_tensor_op_f32_sm80.cu        20-Aug-2024 02:21               16902
gemm_tf32t_tf32n_f32t_tensor_op_f32_sm80.cu        20-Aug-2024 02:21               15131
gemm_tf32t_tf32t_f32t_tensor_op_f32_sm80.cu        20-Aug-2024 02:21               16855
gemm_u8t_u8n_s32t_wmma_tensor_op_s32_sm72.cu       20-Aug-2024 02:21                6854
gemm_universal_bf16t_s8n_bf16t_mixed_input_tens..> 20-Aug-2024 02:21               10186
gemm_universal_bf16t_s8n_f32t_mixed_input_tenso..> 20-Aug-2024 02:21                3940
gemm_universal_bf16t_u8n_bf16t_mixed_input_tens..> 20-Aug-2024 02:21                3956
gemm_universal_bf16t_u8n_f32t_mixed_input_tenso..> 20-Aug-2024 02:21                3941
gemm_universal_cf32n_cf32n_cf32n_tensor_op_f32_..> 20-Aug-2024 02:21                6686
gemm_universal_cf64n_cf64t_cf64t_tensor_op_f64_..> 20-Aug-2024 02:21                6755
gemm_universal_cf64n_cf64t_cf64t_tensor_op_f64_..> 20-Aug-2024 02:21                6687
gemm_universal_f16n_f16t_f32n_tensor_op_f32_sm7..> 20-Aug-2024 02:21                4726
gemm_universal_f16n_f16t_f32t_tensor_op_f32_sm7..> 20-Aug-2024 02:21                4718
gemm_universal_f16t_s8n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3955
gemm_universal_f16t_s8n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3945
gemm_universal_f16t_s8n_f32t_mixed_input_tensor..> 20-Aug-2024 02:21                3935
gemm_universal_f16t_u8n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3956
gemm_universal_f16t_u8n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3946
gemm_universal_f16t_u8n_f32t_mixed_input_tensor..> 20-Aug-2024 02:21                3936
gemm_universal_s8t_bf16n_bf16t_mixed_input_tens..> 20-Aug-2024 02:21               13843
gemm_universal_s8t_bf16n_f32t_mixed_input_tenso..> 20-Aug-2024 02:21                3943
gemm_universal_s8t_f16n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3958
gemm_universal_s8t_f16n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3948
gemm_universal_s8t_f16n_f32t_mixed_input_tensor..> 20-Aug-2024 02:21                3938
gemm_universal_u8t_bf16n_bf16t_mixed_input_tens..> 20-Aug-2024 02:21                3959
gemm_universal_u8t_bf16n_f32t_mixed_input_tenso..> 20-Aug-2024 02:21                3944
gemm_universal_u8t_f16n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3959
gemm_universal_u8t_f16n_f16t_mixed_input_tensor..> 20-Aug-2024 02:21                3949
gemm_universal_u8t_f16n_f32t_mixed_input_tensor..> 20-Aug-2024 02:21                3939
gemm_with_broadcast_f16n_f16n_f16n_tensorop_f32..> 20-Aug-2024 02:21               17827
gemm_with_reduction_f16n_f16n_f16n_tensorop_f32..> 20-Aug-2024 02:21               12841
gemm_with_reduction_f16t_f16n_f16n_tensorop_f32..> 20-Aug-2024 02:21                4544
gemv.cu                                            20-Aug-2024 02:21               17409
hemm_cf32h_cf32n_tensor_op_f32_ls_sm80.cu          20-Aug-2024 02:21                6028
hemm_cf32h_cf32n_tensor_op_f32_rs_sm80.cu          20-Aug-2024 02:21                6031
hemm_cf32h_cf32n_tensor_op_fast_f32_ls_sm80.cu     20-Aug-2024 02:21                6064
hemm_cf32h_cf32n_tensor_op_fast_f32_rs_sm80.cu     20-Aug-2024 02:21                6067
hemm_cf64_cf64_cf64_tensor_op_f64_sm90.cu          20-Aug-2024 02:21                4908
hemm_cf64h_cf64n_cf64n_tensor_op_ls_f64_gaussia..> 20-Aug-2024 02:21                6088
hemm_cf64h_cf64n_cf64n_tensor_op_ls_f64_sm80.cu    20-Aug-2024 02:21                6037
hemm_cf64h_cf64n_cf64n_tensor_op_rs_f64_sm80.cu    20-Aug-2024 02:21                6040
her2k_cf32h_cf32n_tensor_op_f32_sm80.cu            20-Aug-2024 02:21                5382
her2k_cf32h_cf32n_tensor_op_fast_f32_sm80.cu       20-Aug-2024 02:21                5406
her2k_cf64_cf64_tensor_op_f64_sm90.cu              20-Aug-2024 02:21                5401
her2k_cf64h_cf64n_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21               13055
her2k_cf64n_cf64n_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21               13027
her2k_cf64n_cf64n_tensor_op_f64_sm80.cu            20-Aug-2024 02:21                5388
her2k_cf64n_cf64t_tensor_op_f64_sm80.cu            20-Aug-2024 02:21                6939
herk_cf32h_cf32n_tensor_op_f32_sm80.cu             20-Aug-2024 02:21                7677
herk_cf32h_cf32n_tensor_op_fast_f32_sm80.cu        20-Aug-2024 02:21                7725
herk_cf64_cf64_tensor_op_f64_sm90.cu               20-Aug-2024 02:21                3853
herk_cf64h_cf64n_tensor_op_f64_sm80.cu             20-Aug-2024 02:21                6396
multistage_testbed.h                               20-Aug-2024 02:21               10129
multistage_testbed_interleaved.h                   20-Aug-2024 02:21               10270
rank_2k_grouped_scheduler_sm80.cu                  20-Aug-2024 02:21               11186
simt_cgemm_nn_sm50.cu                              20-Aug-2024 02:21               46795
simt_cgemm_nt_sm50.cu                              20-Aug-2024 02:21               54085
simt_cgemm_nt_sm80.cu                              20-Aug-2024 02:21                8318
simt_cgemm_tn_sm50.cu                              20-Aug-2024 02:21               46687
simt_cgemm_tn_sm80.cu                              20-Aug-2024 02:21                8411
simt_cgemm_tt_sm50.cu                              20-Aug-2024 02:21               46578
simt_dgemm_nn_sm50.cu                              20-Aug-2024 02:21               40533
simt_dgemm_nt_sm50.cu                              20-Aug-2024 02:21               47656
simt_dgemm_tn_sm50.cu                              20-Aug-2024 02:21               40441
simt_dgemm_tt_sm50.cu                              20-Aug-2024 02:21               40354
simt_f8gemm_tn_sm50.cu                             20-Aug-2024 02:21                3513
simt_hgemm_nn_sm50.cu                              20-Aug-2024 02:21               89517
simt_hgemm_nt_sm50.cu                              20-Aug-2024 02:21               89304
simt_hgemm_tn_sm50.cu                              20-Aug-2024 02:21               89304
simt_hgemm_tt_sm50.cu                              20-Aug-2024 02:21               89091
simt_igemm_nn_sm50.cu                              20-Aug-2024 02:21               69175
simt_igemm_nt_sm50.cu                              20-Aug-2024 02:21               71438
simt_igemm_tn_sm50.cu                              20-Aug-2024 02:21               67796
simt_igemm_tt_sm50.cu                              20-Aug-2024 02:21               70056
simt_int8_igemm_sm61.cu                            20-Aug-2024 02:21                7156
simt_int8_igemm_sm61_perf.cu                       20-Aug-2024 02:21                6067
simt_int8_igemm_sm61_sliced_k.cu                   20-Aug-2024 02:21                9063
simt_qgemm_nn_sm50.cu                              20-Aug-2024 02:21               35894
simt_qgemm_nt_sm50.cu                              20-Aug-2024 02:21               35813
simt_qgemm_tn_sm50.cu                              20-Aug-2024 02:21               35813
simt_qgemm_tt_sm50.cu                              20-Aug-2024 02:21               35732
simt_sgemm_nn_sm50.cu                              20-Aug-2024 02:21               70872
simt_sgemm_nt_sm50.cu                              20-Aug-2024 02:21               73136
simt_sgemm_nt_sm80.cu                              20-Aug-2024 02:21                8870
simt_sgemm_tn_sm50.cu                              20-Aug-2024 02:21               69488
simt_sgemm_tn_sm80.cu                              20-Aug-2024 02:21                8865
simt_sgemm_tt_sm50.cu                              20-Aug-2024 02:21               71755
simt_sm50.py                                       20-Aug-2024 02:21               17045
simt_zgemm_nn_sm50.cu                              20-Aug-2024 02:21               33231
simt_zgemm_nt_sm50.cu                              20-Aug-2024 02:21               33156
simt_zgemm_tn_sm50.cu                              20-Aug-2024 02:21               33156
simt_zgemm_tt_sm50.cu                              20-Aug-2024 02:21               33081
sm50_gemm_f32_f32_f32_simt.cu                      20-Aug-2024 02:21                5238
sm50_gemm_f64_f64_f64_simt.cu                      20-Aug-2024 02:21                5253
sm61_gemm_s8_s8_s32_simt.cu                        20-Aug-2024 02:21                5357
sm80_gemm_f16_f16_f32_tensor_op_f32.cu             20-Aug-2024 02:21                5479
sm80_gemm_f32_f32_f32_simt.cu                      20-Aug-2024 02:21                5238
sm80_gemm_f64_f64_f64_simt.cu                      20-Aug-2024 02:21                5253
sm80_gemm_f64_f64_f64_tensor_op_f64.cu             20-Aug-2024 02:21                3875
sm80_gemm_s8_s8_s32_tensor_op.cu                   20-Aug-2024 02:21                3734
sm80_gemm_tf32_tf32_f32_tensor_op_f32.cu           20-Aug-2024 02:21                6264
sm90_evt_operations.hpp                            20-Aug-2024 02:21               19334
sm90_gemm_bf16_bf16_bf16_alignx_tensor_op_f32.cu   20-Aug-2024 02:21                5474
sm90_gemm_bf16_bf16_bf16_alignx_tensor_op_f32_w..> 20-Aug-2024 02:21                6888
sm90_gemm_bf16_bf16_bf16_alignx_tensor_op_f32_w..> 20-Aug-2024 02:21                6966
sm90_gemm_bf16_bf16_bf16_alignx_tensor_op_f32_w..> 20-Aug-2024 02:21                6939
sm90_gemm_bf16_bf16_bf16_tensor_op_f32.cu          20-Aug-2024 02:21                8187
sm90_gemm_f16_f16_f16_alignx_tensor_op_f32.cu      20-Aug-2024 02:21               14314
sm90_gemm_f16_f16_f16_alignx_tensor_op_f32_warp..> 20-Aug-2024 02:21               19733
sm90_gemm_f16_f16_f16_alignx_tensor_op_f32_warp..> 20-Aug-2024 02:21               20045
sm90_gemm_f16_f16_f16_alignx_tensor_op_f32_warp..> 20-Aug-2024 02:21               19937
sm90_gemm_f16_f16_f16_tensor_op.cu                 20-Aug-2024 02:21               34699
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_uns..> 20-Aug-2024 02:21               25032
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               25544
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               35857
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                9672
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               29418
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               24553
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                7283
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                8513
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                6899
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               53256
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                9603
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21               20429
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                7252
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                8467
sm90_gemm_f16_f16_f16_tensor_op_f32_cluster_war..> 20-Aug-2024 02:21                6868
sm90_gemm_f16_f16_f16_tensor_op_f32_cooperative..> 20-Aug-2024 02:21               40354
sm90_gemm_f16_f16_f16_tensor_op_f32_group_gemm.cu  20-Aug-2024 02:21                6199
sm90_gemm_f16_f16_f16_tensor_op_f32_ptr_array.cu   20-Aug-2024 02:21                9630
sm90_gemm_f16_f16_f16_tensor_op_f32_tensor_broa..> 20-Aug-2024 02:21               11938
sm90_gemm_f16_f16_f32_tensor_op_f32_rs_cluster_..> 20-Aug-2024 02:21                9732
sm90_gemm_f32_f32_f32_tensor_op_f32.cu             20-Aug-2024 02:21                8365
sm90_gemm_f32_f32_f32_tensor_op_f32_tensor_broa..> 20-Aug-2024 02:21                6382
sm90_gemm_f8_f8_bf16_tensor_op_fp32.cu             20-Aug-2024 02:21               22739
sm90_gemm_f8_f8_bf16_tensor_op_fp32_evt.cu         20-Aug-2024 02:21                8472
sm90_gemm_f8_f8_f32_tensor_op_f32_cluster_warps..> 20-Aug-2024 02:21               22313
sm90_gemm_f8_f8_f32_tensor_op_f32_cluster_warps..> 20-Aug-2024 02:21                8418
sm90_gemm_f8_f8_f32_tensor_op_f32_cooperative_s..> 20-Aug-2024 02:21               23697
sm90_gemm_f8_f8_f32_tensor_op_f32_rs_cluster_wa..> 20-Aug-2024 02:21                9764
sm90_gemm_f8_f8_f32_tensor_op_fp32.cu              20-Aug-2024 02:21               22879
sm90_gemm_f8_f8_f8_tensor_op_fp32.cu               20-Aug-2024 02:21               54394
sm90_gemm_f8_f8_f8_tensor_op_fp32_evt.cu           20-Aug-2024 02:21                8504
sm90_gemm_s8_s8_s8_alignx_tensor_op_s32.cu         20-Aug-2024 02:21                5295
sm90_gemm_s8_s8_s8_alignx_tensor_op_s32_warpspe..> 20-Aug-2024 02:21                6593
sm90_gemm_s8_s8_s8_alignx_tensor_op_s32_warpspe..> 20-Aug-2024 02:21                6662
sm90_gemm_s8_s8_s8_alignx_tensor_op_s32_warpspe..> 20-Aug-2024 02:21                6644
sm90_gemm_s8_s8_s8_tensor_op_s32.cu                20-Aug-2024 02:21               15791
sm90_gemm_s8_s8_s8_tensor_op_s32_tensor_broadca..> 20-Aug-2024 02:21                4566
sm90_gemm_stream_k_scheduler.cu                    20-Aug-2024 02:21               12733
sm90_gemm_tf32_tf32_f32_alignx_tensor_op_f32.cu    20-Aug-2024 02:21                5297
sm90_gemm_tf32_tf32_f32_alignx_tensor_op_f32_wa..> 20-Aug-2024 02:21                6590
sm90_gemm_tf32_tf32_f32_alignx_tensor_op_f32_wa..> 20-Aug-2024 02:21                6659
sm90_gemm_tf32_tf32_f32_alignx_tensor_op_f32_wa..> 20-Aug-2024 02:21                6641
sm90_gemm_tf32_tf32_f32_tensor_op_f32.cu           20-Aug-2024 02:21                7972
sm90_gemm_tf32_tf32_f32_tensor_op_f32_gmma_rs_c..> 20-Aug-2024 02:21               21505
symm_cf32n_cf32n_tensor_op_f32_ls_sm80.cu          20-Aug-2024 02:21                5923
symm_cf32n_cf32n_tensor_op_f32_rs_sm80.cu          20-Aug-2024 02:21                5926
symm_cf32n_cf32n_tensor_op_fast_f32_ls_sm80.cu     20-Aug-2024 02:21                5959
symm_cf32n_cf32n_tensor_op_fast_f32_rs_sm80.cu     20-Aug-2024 02:21                5962
symm_cf64_cf64_cf64_tensor_op_f64_sm90.cu          20-Aug-2024 02:21                4838
symm_cf64n_cf64n_cf64n_tensor_op_ls_f64_gaussia..> 20-Aug-2024 02:21                5983
symm_cf64n_cf64n_cf64n_tensor_op_ls_f64_sm80.cu    20-Aug-2024 02:21                5932
symm_cf64n_cf64n_cf64n_tensor_op_rs_f64_sm80.cu    20-Aug-2024 02:21                5935
symm_f32n_f32n_tensor_op_fast_f32_ls_sm80.cu       20-Aug-2024 02:21               15203
symm_f32n_f32n_tensor_op_fast_f32_rs_sm80.cu       20-Aug-2024 02:21                8623
symm_f32t_f32t_tensor_op_fast_f32_ls_sm80.cu       20-Aug-2024 02:21               15104
symm_f64_f64_tensor_op_f64_sm90.cu                 20-Aug-2024 02:21                4777
symm_f64n_f64n_tensor_op_f64_ls_sm80.cu            20-Aug-2024 02:21                8103
symm_f64n_f64n_tensor_op_f64_rs_sm80.cu            20-Aug-2024 02:21                8108
symm_f64n_f64t_tensor_op_f64_ls_sm80.cu            20-Aug-2024 02:21                8088
symm_f64n_f64t_tensor_op_f64_rs_sm80.cu            20-Aug-2024 02:21                8093
symm_f64t_f64n_tensor_op_f64_ls_sm80.cu            20-Aug-2024 02:21                8073
symm_f64t_f64n_tensor_op_f64_rs_sm80.cu            20-Aug-2024 02:21                8078
symm_f64t_f64t_tensor_op_f64_ls_sm80.cu            20-Aug-2024 02:21                8058
symm_f64t_f64t_tensor_op_f64_rs_sm80.cu            20-Aug-2024 02:21                8063
symm_tf32n_f32n_tensor_op_f32_ls_sm80.cu           20-Aug-2024 02:21               15071
symm_tf32n_f32n_tensor_op_f32_rs_sm80.cu           20-Aug-2024 02:21                8551
symm_tf32t_f32t_tensor_op_f32_ls_sm80.cu           20-Aug-2024 02:21               14972
syr2k_cf32n_cf32n_tensor_op_f32_sm80.cu            20-Aug-2024 02:21                5362
syr2k_cf32n_cf32n_tensor_op_fast_f32_sm80.cu       20-Aug-2024 02:21                5386
syr2k_cf32n_cf32t_tensor_op_f32_sm80.cu            20-Aug-2024 02:21                5432
syr2k_cf32n_cf32t_tensor_op_fast_f32_sm80.cu       20-Aug-2024 02:21                5456
syr2k_cf64_cf64_tensor_op_f64_sm90.cu              20-Aug-2024 02:21                5378
syr2k_cf64n_cf64n_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21               12952
syr2k_cf64n_cf64n_tensor_op_f64_sm80.cu            20-Aug-2024 02:21                5444
syr2k_cf64n_cf64t_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21                7208
syr2k_cf64n_cf64t_tensor_op_f64_sm80.cu            20-Aug-2024 02:21                5362
syr2k_cf64t_cf64n_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21                7199
syr2k_cf64t_cf64t_tensor_op_f64_grouped_sm80.cu    20-Aug-2024 02:21                7190
syr2k_f32n_f32n_tensor_op_fast_f32_sm80.cu         20-Aug-2024 02:21                4794
syr2k_f32t_f32n_tensor_op_fast_f32_sm80.cu         20-Aug-2024 02:21                4783
syr2k_f64_f64_tensor_op_f64_sm90.cu                20-Aug-2024 02:21                4739
syr2k_f64n_f64n_tensor_op_f64_grouped_sm80.cu      20-Aug-2024 02:21               19145
syr2k_f64n_f64n_tensor_op_f64_sm80.cu              20-Aug-2024 02:21                7991
syr2k_f64n_f64t_tensor_op_f64_grouped_sm80.cu      20-Aug-2024 02:21               11015
syr2k_f64n_f64t_tensor_op_f64_sm80.cu              20-Aug-2024 02:21                7976
syr2k_f64t_f64n_tensor_op_f64_grouped_sm80.cu      20-Aug-2024 02:21               12342
syr2k_f64t_f64n_tensor_op_f64_sm80.cu              20-Aug-2024 02:21                7961
syr2k_f64t_f64t_tensor_op_f64_grouped_sm80.cu      20-Aug-2024 02:21               12321
syr2k_tf32n_f32n_tensor_op_f32_sm80.cu             20-Aug-2024 02:21                4786
syr2k_tf32t_f32n_tensor_op_f32_sm80.cu             20-Aug-2024 02:21                4775
syrk_cf32n_cf32n_tensor_op_f32_sm80.cu             20-Aug-2024 02:21                4993
syrk_cf32n_cf32n_tensor_op_fast_f32_sm80.cu        20-Aug-2024 02:21                5017
syrk_cf32n_cf32t_tensor_op_f32_sm80.cu             20-Aug-2024 02:21                4987
syrk_cf32n_cf32t_tensor_op_fast_f32_sm80.cu        20-Aug-2024 02:21                5011
syrk_cf64_cf64_tensor_op_f64_sm90.cu               20-Aug-2024 02:21                5023
syrk_cf64n_cf64n_tensor_op_f64_sm80.cu             20-Aug-2024 02:21                4996
syrk_cf64n_cf64t_tensor_op_f64_gaussian_sm80.cu    20-Aug-2024 02:21                3793
syrk_cf64n_cf64t_tensor_op_f64_sm80.cu             20-Aug-2024 02:21                4990
syrk_f32n_f32t_tensor_op_fast_f32_sm80.cu          20-Aug-2024 02:21               16084
syrk_f32t_f32t_tensor_op_fast_f32_sm80.cu          20-Aug-2024 02:21               16042
syrk_f64_f64_tensor_op_f64_sm90.cu                 20-Aug-2024 02:21                4529
syrk_f64n_f64t_tensor_op_f64_sm80.cu               20-Aug-2024 02:21                7451
syrk_f64t_f64n_tensor_op_f64_sm80.cu               20-Aug-2024 02:21                9401
syrk_tf32n_f32t_tensor_op_f32_sm80.cu              20-Aug-2024 02:21               16028
syrk_tf32t_f32t_tensor_op_f32_sm80.cu              20-Aug-2024 02:21               15986
testbed.h                                          20-Aug-2024 02:21               20429
testbed_complex.h                                  20-Aug-2024 02:21                8262
testbed_gemm_with_broadcast.h                      20-Aug-2024 02:21               20929
testbed_gemm_with_reduction.h                      20-Aug-2024 02:21               19443
testbed_grouped.h                                  20-Aug-2024 02:21               16502
testbed_grouped_rank_2k.h                          20-Aug-2024 02:21               16562
testbed_grouped_rank_2k_scheduler.h                20-Aug-2024 02:21               17002
testbed_grouped_scheduler.h                        20-Aug-2024 02:21               14698
testbed_interleaved.h                              20-Aug-2024 02:21               10226
testbed_planar_complex.h                           20-Aug-2024 02:21                9479
testbed_rank2k_universal.h                         20-Aug-2024 02:21               20896
testbed_rank_k_universal.h                         20-Aug-2024 02:21               15650
testbed_sanity.h                                   20-Aug-2024 02:21                8639
testbed_sparse.h                                   20-Aug-2024 02:21               16068
testbed_splitk.h                                   20-Aug-2024 02:21                6122
testbed_symm_universal.h                           20-Aug-2024 02:21               19991
testbed_trmm_universal.h                           20-Aug-2024 02:21               20228
testbed_universal.h                                20-Aug-2024 02:21               17969
testbed_utils.h                                    20-Aug-2024 02:21                2626
testbed_with_absmax.h                              20-Aug-2024 02:21               22501
trmm_cf32n_cf32n_cf32t_tensor_op_f32_sm80.cu       20-Aug-2024 02:21                9916
trmm_cf32n_cf32n_cf32t_tensor_op_fast_f32_sm80.cu  20-Aug-2024 02:21                9988
trmm_cf64_cf64_cf64_tensor_op_f64_sm90.cu          20-Aug-2024 02:21                4988
trmm_cf64n_cf64n_cf64t_tensor_op_f64_gaussian_s..> 20-Aug-2024 02:21                4992
trmm_cf64n_cf64n_cf64t_tensor_op_f64_sm80.cu       20-Aug-2024 02:21                9762
trmm_f32n_f32t_f32t_tensor_op_fast_f32_ls_sm80.cu  20-Aug-2024 02:21               15614
trmm_f32n_f32t_f32t_tensor_op_fast_f32_rs_sm80.cu  20-Aug-2024 02:21                8733
trmm_f32t_f32n_f32n_tensor_op_fast_f32_ls_sm80.cu  20-Aug-2024 02:21               14089
trmm_f32t_f32n_f32t_tensor_op_fast_f32_ls_sm80.cu  20-Aug-2024 02:21               14444
trmm_f64_f64_f64_tensor_op_f64_sm90.cu             20-Aug-2024 02:21                4607
trmm_f64n_f64n_f64t_tensor_op_f64_ls_sm80.cu       20-Aug-2024 02:21               12798
trmm_f64n_f64n_f64t_tensor_op_f64_rs_sm80.cu       20-Aug-2024 02:21               12809
trmm_f64n_f64t_f64t_tensor_op_f64_rs_sm80.cu       20-Aug-2024 02:21               12764
trmm_f64t_f64t_f64n_tensor_op_f64_ls_sm80.cu       20-Aug-2024 02:21               12768
trmm_f64t_f64t_f64n_tensor_op_f64_rs_sm80.cu       20-Aug-2024 02:21               12779
trmm_tf32n_tf32t_f32t_tensor_op_f32_ls_sm80.cu     20-Aug-2024 02:21               15504
trmm_tf32n_tf32t_f32t_tensor_op_f32_rs_sm80.cu     20-Aug-2024 02:21                8673
trmm_tf32t_tf32n_f32n_tensor_op_f32_ls_sm80.cu     20-Aug-2024 02:21               13989
trmm_tf32t_tf32n_f32t_tensor_op_f32_ls_sm80.cu     20-Aug-2024 02:21               14520