| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | /***************************************************************************************************
 | 
					
						
							| 
									
										
										
										
											2023-01-21 05:32:57 +08:00
										 |  |  |  * Copyright (c) 2017 - 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved. | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  |  * SPDX-License-Identifier: BSD-3-Clause | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  |  * Redistribution and use in source and binary forms, with or without | 
					
						
							|  |  |  |  * modification, are permitted provided that the following conditions are met: | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |  * | 
					
						
							| 
									
										
										
										
											2022-04-24 03:02:38 +08:00
										 |  |  |  * 1. Redistributions of source code must retain the above copyright notice, this | 
					
						
							|  |  |  |  * list of conditions and the following disclaimer. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | 
					
						
							|  |  |  |  * this list of conditions and the following disclaimer in the documentation | 
					
						
							|  |  |  |  * and/or other materials provided with the distribution. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * 3. Neither the name of the copyright holder nor the names of its | 
					
						
							|  |  |  |  * contributors may be used to endorse or promote products derived from | 
					
						
							|  |  |  |  * this software without specific prior written permission. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | 
					
						
							|  |  |  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | 
					
						
							|  |  |  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE | 
					
						
							|  |  |  |  * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE | 
					
						
							|  |  |  |  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL | 
					
						
							|  |  |  |  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR | 
					
						
							|  |  |  |  * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER | 
					
						
							|  |  |  |  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, | 
					
						
							|  |  |  |  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
					
						
							|  |  |  |  * | 
					
						
							|  |  |  |  **************************************************************************************************/ | 
					
						
							|  |  |  | /* \file
 | 
					
						
							|  |  |  |    \brief Defines a math function | 
					
						
							|  |  |  | */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #pragma once
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | #include <vector>
 | 
					
						
							|  |  |  | #include <string>
 | 
					
						
							|  |  |  | #include <memory>
 | 
					
						
							|  |  |  | #include <unordered_map>
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // CUTLASS Library includes
 | 
					
						
							|  |  |  | #include "cutlass/library/library.h"
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  | #include "cutlass/library/util.h"
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | #include "cutlass/library/manifest.h"
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // Profiler includes
 | 
					
						
							|  |  |  | #include "options.h"
 | 
					
						
							|  |  |  | #include "device_context.h"
 | 
					
						
							|  |  |  | #include "performance_result.h"
 | 
					
						
							|  |  |  | #include "performance_report.h"
 | 
					
						
							|  |  |  | #include "problem_space.h"
 | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  | #include "debug.h"
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | /////////////////////////////////////////////////////////////////////////////////////////////////
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | namespace cutlass { | 
					
						
							|  |  |  | namespace profiler { | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /////////////////////////////////////////////////////////////////////////////////////////////////
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /// Abstract base class for each math function
 | 
					
						
							|  |  |  | class OperationProfiler { | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | protected: | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Data members
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Top-level operation kind
 | 
					
						
							|  |  |  |   library::OperationKind kind_; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Human readable description
 | 
					
						
							|  |  |  |   std::string description_; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Arguments parsed from command line
 | 
					
						
							|  |  |  |   ArgumentDescriptionVector arguments_; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// List of providers used to verify and compare each result
 | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |   ProviderVector verification_providers_; | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   /// Model performance result initailized by the operation profiler with workload statistics
 | 
					
						
							|  |  |  |   /// and reasonable default state.
 | 
					
						
							|  |  |  |   PerformanceResult model_result_; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Performance result vector constructed by profiling the operation
 | 
					
						
							|  |  |  |   PerformanceResultVector results_; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Methods
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Ctor
 | 
					
						
							|  |  |  |   OperationProfiler(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   OperationProfiler( | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |     Options const &options, | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |     library::OperationKind kind,  | 
					
						
							|  |  |  |     ArgumentDescriptionVector const &arguments = ArgumentDescriptionVector(), | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |     ProviderVector const & verification_providers = ProviderVector()); | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   /// Destructor
 | 
					
						
							|  |  |  |   virtual ~OperationProfiler(); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Obtains the operation kind
 | 
					
						
							|  |  |  |   library::OperationKind kind() const { return kind_; } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Gets the schema description
 | 
					
						
							|  |  |  |   std::string const &description() const; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Returns a reference to the arguments
 | 
					
						
							|  |  |  |   ArgumentDescriptionVector const &arguments() const { return arguments_; } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Basic overrides
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Prints usage statement for the math function
 | 
					
						
							|  |  |  |   virtual void print_usage(std::ostream &out) const; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Prints examples
 | 
					
						
							|  |  |  |   virtual void print_examples(std::ostream &out) const =0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Entry point to profile all operations in the manifest
 | 
					
						
							|  |  |  |   virtual int profile_all( | 
					
						
							|  |  |  |     Options const &options,  | 
					
						
							|  |  |  |     library::Manifest const &manifest,  | 
					
						
							|  |  |  |     DeviceContext &device_context); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Operation-specific phases of verification and profiling
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Extracts the problem dimensions
 | 
					
						
							|  |  |  |   virtual Status initialize_configuration( | 
					
						
							|  |  |  |     Options const &options,  | 
					
						
							|  |  |  |     PerformanceReport &report,  | 
					
						
							|  |  |  |     DeviceContext &device_context, | 
					
						
							|  |  |  |     library::Operation const *operation, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     ProblemSpace::Problem const &problem) = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Initializes workspace
 | 
					
						
							|  |  |  |   virtual Status initialize_workspace( | 
					
						
							|  |  |  |     Options const &options,  | 
					
						
							|  |  |  |     PerformanceReport &report,  | 
					
						
							|  |  |  |     DeviceContext &device_context, | 
					
						
							|  |  |  |     library::Operation const *operation, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     ProblemSpace::Problem const &problem) = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Verifies CUTLASS against references
 | 
					
						
							|  |  |  |   virtual bool verify_cutlass( | 
					
						
							|  |  |  |     Options const &options,   | 
					
						
							|  |  |  |     PerformanceReport &report, | 
					
						
							|  |  |  |     DeviceContext &device_context, | 
					
						
							|  |  |  |     library::Operation const *operation, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     ProblemSpace::Problem const &problem) = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Measures performance results
 | 
					
						
							|  |  |  |   virtual bool profile( | 
					
						
							|  |  |  |     Options const &options,   | 
					
						
							|  |  |  |     PerformanceReport &report, | 
					
						
							|  |  |  |     DeviceContext &device_context, | 
					
						
							|  |  |  |     library::Operation const *operation, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     ProblemSpace::Problem const &problem) = 0; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | public: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  |   // Static helpers
 | 
					
						
							|  |  |  |   //
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Sleep for a given duration in ms
 | 
					
						
							|  |  |  |   static void sleep(int sleep_duration); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Returns true if the current operation description satisfies the problem space
 | 
					
						
							|  |  |  |   static bool satisfies( | 
					
						
							|  |  |  |     library::OperationDescription const &op_desc, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     ProblemSpace::Problem const &problem); | 
					
						
							|  |  |  |    | 
					
						
							|  |  |  |   /// Compares tensors for equality
 | 
					
						
							|  |  |  |   static Disposition compare_tensors( | 
					
						
							|  |  |  |     Options const &options, | 
					
						
							|  |  |  |     DeviceAllocation &experimental, | 
					
						
							| 
									
										
										
										
											2020-09-24 05:00:58 +08:00
										 |  |  |     DeviceAllocation &reference, | 
					
						
							|  |  |  |     int64_t count = 0); | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |   static void save_workspace( | 
					
						
							|  |  |  |     DeviceContext &device_context, | 
					
						
							|  |  |  |     Options const &options, | 
					
						
							|  |  |  |     library::OperationDescription const &desc, | 
					
						
							| 
									
										
										
										
											2020-04-08 04:51:25 +08:00
										 |  |  |     library::Provider provider, | 
					
						
							|  |  |  |     library::Provider verification_provider = library::Provider::kInvalid); | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |    | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |   /// Helper to set a performance result member
 | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |   static void set_argument(   | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |     PerformanceResult &result, | 
					
						
							|  |  |  |     char const *name, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     std::string const &value); | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Helper to set a performance result member
 | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  |   static void set_argument(   | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |     PerformanceResult &result, | 
					
						
							|  |  |  |     char const *name, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space, | 
					
						
							|  |  |  |     int64_t value); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  | protected: | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |   /// Sets operation description 
 | 
					
						
							|  |  |  |   static void initialize_result_( | 
					
						
							|  |  |  |     PerformanceResult &result, | 
					
						
							|  |  |  |     library::OperationDescription const &operation_desc, | 
					
						
							|  |  |  |     ProblemSpace const &problem_space); | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |   /// Method to profile an initialized CUTLASS operation
 | 
					
						
							|  |  |  |   virtual Status profile_cutlass_( | 
					
						
							|  |  |  |     double &runtime, | 
					
						
							|  |  |  |     Options const &options, | 
					
						
							|  |  |  |     library::Operation const *operation, | 
					
						
							| 
									
										
										
										
											2020-09-24 05:00:58 +08:00
										 |  |  |     void *arguments, | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  |     void *host_workspace, | 
					
						
							|  |  |  |     void *device_workspace); | 
					
						
							| 
									
										
										
										
											2020-06-09 07:17:35 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | private: | 
					
						
							|  |  |  |   /// finds string matches filter_string in operation_name
 | 
					
						
							|  |  |  |   bool find_string_matches_( | 
					
						
							|  |  |  |     std::string const &filter_string,  | 
					
						
							|  |  |  |     std::string const &operation_name); | 
					
						
							| 
									
										
										
										
											2019-11-20 08:55:34 +08:00
										 |  |  | }; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /////////////////////////////////////////////////////////////////////////////////////////////////
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /// Vector of owning operation profilers
 | 
					
						
							|  |  |  | using OperationProfilerVector = std::vector<std::unique_ptr<OperationProfiler>>; | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /////////////////////////////////////////////////////////////////////////////////////////////////
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | } // namespace profiler
 | 
					
						
							|  |  |  | } // namespace cutlass
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | /////////////////////////////////////////////////////////////////////////////////////////////////
 |