Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -404,7 +404,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -662,7 +662,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
4 changes: 2 additions & 2 deletions examples/10_planar_complex/planar_complex.cu
Original file line number Diff line number Diff line change
Expand Up @@ -416,7 +416,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -476,7 +476,7 @@ public:
}

std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " GFLOPs: " << result.gflops << std::endl;
std::cout << " GFLOPS: " << result.gflops << std::endl;

return result;
}
Expand Down
4 changes: 2 additions & 2 deletions examples/11_planar_complex_array/planar_complex_array.cu
Original file line number Diff line number Diff line change
Expand Up @@ -477,7 +477,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -537,7 +537,7 @@ public:
}

std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " GFLOPs: " << result.gflops << std::endl;
std::cout << " GFLOPS: " << result.gflops << std::endl;

return result;
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -369,7 +369,7 @@ int run(Options &options) {
return -1;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -412,7 +412,7 @@ int run(Options &options) {

if (passed) {
std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " GFLOPs: " << result.gflops << std::endl;
std::cout << " GFLOPS: " << result.gflops << std::endl;
}

std::cout << (passed ? "Passed" : "Failed") << std::endl;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -499,7 +499,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPS";

return out;
}
Expand Down
4 changes: 2 additions & 2 deletions examples/21_quaternion_gemm/quaternion_gemm.cu
Original file line number Diff line number Diff line change
Expand Up @@ -378,7 +378,7 @@ int run(Options options) {
return -1;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -424,7 +424,7 @@ int run(Options options) {

if (passed) {
std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " GFLOPs: " << result.gflops << std::endl;
std::cout << " GFLOPS: " << result.gflops << std::endl;
}

std::cout << (passed ? "Passed" : "Failed") << std::endl;
Expand Down
4 changes: 2 additions & 2 deletions examples/22_quaternion_conv/quaternion_conv.cu
Original file line number Diff line number Diff line change
Expand Up @@ -321,7 +321,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -577,7 +577,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -678,7 +678,7 @@ Result profile(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);

// Cleanup
Expand Down
10 changes: 5 additions & 5 deletions examples/24_gemm_grouped/gemm_grouped.cu
Original file line number Diff line number Diff line change
Expand Up @@ -268,7 +268,7 @@ struct Options {
output_file.open(output_path.c_str(), open_mode);

if (output_file.good() && open_mode != std::ios_base::app) {
output_file << "Tag,Provider,Kind,Groups,Runtime,GFLOPs\n";
output_file << "Tag,Provider,Kind,Groups,Runtime,GFLOPS\n";
}
}

Expand Down Expand Up @@ -1118,7 +1118,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(this->options.iterations);
result.gflops = this->options.gflops(result.runtime_ms / 1000.0);

Expand All @@ -1139,7 +1139,7 @@ public:
std::cout << " " << this->options.problem_bins.size() << " batched GEMMs launched" << std::endl;
std::cout << std::endl;
std::cout << " " << "Batched Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " " << "Batched GFLOPs: " << result.gflops << std::endl;
std::cout << " " << "Batched GFLOPS: " << result.gflops << std::endl;

std::string provider = "CUTLASS";

Expand Down Expand Up @@ -1380,7 +1380,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(this->options.iterations);
result.gflops = this->options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -1413,7 +1413,7 @@ public:

std::cout << std::endl;
std::cout << " " << "Grouped Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " " << "Grouped GFLOPs: " << result.gflops << std::endl;
std::cout << " " << "Grouped GFLOPS: " << result.gflops << std::endl;
if (this->options.profile_initialization) {
std::cout << " " << "Init Runtime: " << result.initialization_time_ms << " ms" << std::endl;
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -347,7 +347,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,D,H,W,C,K,T,R,S,Stride_D,Stride_H,Stride_W,Runtime,GFLOPs";
out << "Layer,N,D,H,W,C,K,T,R,S,Stride_D,Stride_H,Stride_W,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -659,7 +659,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -340,7 +340,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -651,7 +651,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -337,7 +337,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -649,7 +649,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -532,7 +532,7 @@ bool run(Options &options) {
return false;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.m = problem_size.m();
result.n = problem_size.n();
result.k = problem_size.k();
Expand Down Expand Up @@ -661,7 +661,7 @@ bool run(Options &options) {
std::cout.precision(4);
std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout.precision(2);
std::cout << "GFLOPs: " << result.gflops << std::endl;
std::cout << "GFLOPS: " << result.gflops << std::endl;
std::cout << "Normalized L2 norm of" << std::endl;
std::cout.precision(8);
std::cout << std::scientific
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -333,7 +333,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPs,3xTF32_vs_FP64,1xTF32_vs_FP64,FP32_vs_FP64";
out << "Layer,N,H,W,C,K,R,S,Runtime,GFLOPS,3xTF32_vs_FP64,1xTF32_vs_FP64,FP32_vs_FP64";

return out;
}
Expand Down Expand Up @@ -559,7 +559,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -472,7 +472,7 @@ bool run(Options &options) {
return false;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.m = problem_size.m();
result.n = problem_size.n();
result.k = problem_size.k();
Expand Down Expand Up @@ -603,7 +603,7 @@ bool run(Options &options) {
std::cout.precision(4);
std::cout << "Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout.precision(2);
std::cout << "GFLOPs: " << result.gflops << std::endl;
std::cout << "GFLOPS: " << result.gflops << std::endl;
std::cout << "Normalized L2 norm of" << std::endl;
std::cout.precision(8);
std::cout << std::scientific
Expand Down
4 changes: 2 additions & 2 deletions examples/30_wgrad_split_k/30_wgrad_split_k.cu
Original file line number Diff line number Diff line change
Expand Up @@ -364,7 +364,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -674,7 +674,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
4 changes: 2 additions & 2 deletions examples/34_transposed_conv2d/34_transposed_conv2d.cu
Original file line number Diff line number Diff line change
Expand Up @@ -302,7 +302,7 @@ struct Result {
out << "Name,";
}

out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPs";
out << "Layer,N,H,W,C,K,R,S,Stride_H,Stride_W,Runtime,GFLOPS";

return out;
}
Expand Down Expand Up @@ -574,7 +574,7 @@ Result profile_convolution(Options const &options) {
return result;
}

// Print average runtime and GFLOPs.
// Print average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand Down
2 changes: 1 addition & 1 deletion examples/35_gemm_softmax/gemm_softmax.cu
Original file line number Diff line number Diff line change
Expand Up @@ -675,7 +675,7 @@ struct Testbed {

std::cout << " Runtime: " << elapsed_ms_per_iter << " ms\n" << std::endl;

std::cout << " GFLOPs: " << gflops_per_second << " GFLOPs" << std::endl;
std::cout << " GFLOPS: " << gflops_per_second << " GFLOPS" << std::endl;
std::cout << "Memory bandwidth: " << gbytes_per_second << " GiB/s" << std::endl;

return true;
Expand Down
4 changes: 2 additions & 2 deletions examples/36_gather_scatter_fusion/gather_scatter_fusion.cu
Original file line number Diff line number Diff line change
Expand Up @@ -489,7 +489,7 @@ int run(Options &options) {
return -1;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(options.iterations);
result.gflops = options.gflops(result.runtime_ms / 1000.0);

Expand All @@ -499,7 +499,7 @@ int run(Options &options) {
}

std::cout << "Runtime: " << result.runtime_ms << " ms\n";
std::cout << " GFLOPs: " << result.gflops << "\n";
std::cout << " GFLOPS: " << result.gflops << "\n";

return 0;
}
Expand Down
2 changes: 1 addition & 1 deletion examples/37_gemm_layernorm_gemm_fusion/gemm_layernorm.cu
Original file line number Diff line number Diff line change
Expand Up @@ -885,7 +885,7 @@ struct Testbed {
<< std::endl;

std::cout << " Runtime / iteration: " << elapsed_ms_per_iter << " ms\n" << std::endl;
std::cout << " GFLOPs: " << gflops_per_second << " GFLOPs" << std::endl;
std::cout << " GFLOPS: " << gflops_per_second << " GFLOPS" << std::endl;

return true;
}
Expand Down
8 changes: 4 additions & 4 deletions examples/38_syr2k_grouped/syr2k_grouped.cu
Original file line number Diff line number Diff line change
Expand Up @@ -242,7 +242,7 @@ struct Options {
output_file.open(output_path.c_str(), open_mode);

if (output_file.good() && open_mode != std::ios_base::app) {
output_file << "Tag,Provider,Kind,Groups,Runtime,GFLOPs\n";
output_file << "Tag,Provider,Kind,Groups,Runtime,GFLOPS\n";
}
}

Expand Down Expand Up @@ -994,7 +994,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(this->options.iterations);
result.gflops = this->options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -1246,7 +1246,7 @@ public:
return result;
}

// Compute average runtime and GFLOPs.
// Compute average runtime and GFLOPS.
result.runtime_ms = double(runtime_ms) / double(this->options.iterations);
result.gflops = this->options.gflops(result.runtime_ms / 1000.0);

Expand Down Expand Up @@ -1279,7 +1279,7 @@ public:

std::cout << std::endl;
std::cout << " " << "Grouped Runtime: " << result.runtime_ms << " ms" << std::endl;
std::cout << " " << "Grouped GFLOPs: " << result.gflops << std::endl;
std::cout << " " << "Grouped GFLOPS: " << result.gflops << std::endl;
if (this->options.profile_initialization) {
std::cout << " " << "Init Runtime: " << result.initialization_time_ms << " ms" << std::endl;
}
Expand Down
Loading