1 /* -*- c++ -*- */
2 /*
3  * Copyright © 2020 Intel Corporation
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the "Software"),
7  * to deal in the Software without restriction, including without limitation
8  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9  * and/or sell copies of the Software, and to permit persons to whom the
10  * Software is furnished to do so, subject to the following conditions:
11  *
12  * The above copyright notice and this permission notice (including the next
13  * paragraph) shall be included in all copies or substantial portions of the
14  * Software.
15  *
16  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22  * IN THE SOFTWARE.
23  */
24 
25 #ifndef BRW_IR_PERFORMANCE_H
26 #define BRW_IR_PERFORMANCE_H
27 
28 class fs_visitor;
29 
30 namespace brw {
31    class vec4_visitor;
32 
33    /**
34     * Various estimates of the performance of a shader based on static
35     * analysis.
36     */
37    struct performance {
38       performance(const fs_visitor *v);
39       performance(const vec4_visitor *v);
40       ~performance();
41 
42       analysis_dependency_class
dependency_classperformance43       dependency_class() const
44       {
45          return (DEPENDENCY_INSTRUCTIONS |
46                  DEPENDENCY_BLOCKS);
47       }
48 
49       bool
validateperformance50       validate(const backend_shader *) const
51       {
52          return true;
53       }
54 
55       /**
56        * Array containing estimates of the runtime of each basic block of the
57        * program in cycle units.
58        */
59       unsigned *block_latency;
60 
61       /**
62        * Estimate of the runtime of the whole program in cycle units assuming
63        * uncontended execution.
64        */
65       unsigned latency;
66 
67       /**
68        * Estimate of the throughput of the whole program in
69        * invocations-per-cycle units.
70        *
71        * Note that this might be lower than the ratio between the dispatch
72        * width of the program and its latency estimate in cases where
73        * performance doesn't scale without limits as a function of its thread
74        * parallelism, e.g. due to the existence of a bottleneck in a shared
75        * function.
76        */
77       float throughput;
78 
79    private:
80       performance(const performance &perf);
81       performance &
82       operator=(performance u);
83    };
84 }
85 
86 #endif
87