// ssyrk.cu
// (web code-viewer residue: font-size control label)
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}
// NOTE(review): the lines above close a kernel whose signature and leading
// #undef/#define lines lie before this part of the file. They are kept
// token-for-token and only split so that each directive has its own line.

/*
 * SSYRK kernel variants.
 *
 * None of the kernels below has code of its own: each body is the text of
 * "ssyrk.h", included after six configuration macros have been reset with
 * #undef and given new values with #define. Every kernel takes a single
 * by-value argument, `struct cublasSsyrkParams parms`.
 *
 * Every preprocessor directive sits on its own line: a directive runs to the
 * end of its line, so fusing several directives (or a directive and a brace)
 * onto one line keeps the #include from ever being processed.
 *
 * Across all kernels in this section, the name and the macro values line up
 * as follows:
 *
 *   name contains     macro setting
 *   ---------------   ---------------------------
 *   "_up_"            UPPER 1
 *   "_lo_"            UPPER 0
 *   "_tr_"            TRANSA 1, TRANSB 0
 *   "_nt_"            TRANSA 0, TRANSB 1
 *   "_sw"             USE_MIXED_STEPPER 1
 *   "_hw"             USE_MIXED_STEPPER 0
 *   "fast_" prefix    FAST_IMUL 1 (otherwise 0)
 *   "_fulltile"       FULL_TILES_ONLY 1 (otherwise 0)
 *
 * NOTE(review): what each macro selects is decided inside "ssyrk.h", which is
 * not visible here -- confirm there before relying on the names alone.
 */

/* ---- FULL_TILES_ONLY 0, FAST_IMUL 0 ---- */

__global__ void ssyrk_lo_nt_main_hw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

/* ---- FULL_TILES_ONLY 0, FAST_IMUL 1 ---- */

__global__ void fast_ssyrk_up_tr_main_sw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_tr_main_sw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_nt_main_sw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_nt_main_sw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_tr_main_hw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_tr_main_hw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_nt_main_hw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_nt_main_hw (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 0
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

/* ---- FULL_TILES_ONLY 1, FAST_IMUL 0 ---- */

__global__ void ssyrk_up_tr_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 0
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void ssyrk_lo_tr_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 0
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void ssyrk_up_nt_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 0
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void ssyrk_lo_nt_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 0
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void ssyrk_up_tr_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void ssyrk_lo_tr_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void ssyrk_up_nt_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void ssyrk_lo_nt_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 0
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

/* ---- FULL_TILES_ONLY 1, FAST_IMUL 1 ---- */

__global__ void fast_ssyrk_up_tr_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_tr_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_nt_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_nt_main_sw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 1
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_tr_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_tr_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 1
#define TRANSB 0
#include "ssyrk.h"
}

__global__ void fast_ssyrk_up_nt_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 1
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}

__global__ void fast_ssyrk_lo_nt_main_hw_fulltile (struct cublasSsyrkParams parms)
{
#undef FULL_TILES_ONLY
#undef USE_MIXED_STEPPER
#undef FAST_IMUL
#undef UPPER
#undef TRANSA
#undef TRANSB
#define FULL_TILES_ONLY 1
#define USE_MIXED_STEPPER 0
#define FAST_IMUL 1
#define UPPER 0
#define TRANSA 0
#define TRANSB 1
#include "ssyrk.h"
}
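/*
 * Web code-viewer residue (not part of the original source file):
 * keyboard shortcut help.
 *   Copy code:            Ctrl + C
 *   Search code:          Ctrl + F
 *   Full-screen mode:     F11
 *   Toggle theme:         Ctrl + Shift + D
 *   Show shortcuts:       ?
 *   Increase font size:   Ctrl + =
 *   Decrease font size:   Ctrl + -
 */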