generated from taichi-dev/voxel-challenge
-
Notifications
You must be signed in to change notification settings - Fork 0
/
profile.log
172 lines (172 loc) · 13.4 KB
/
profile.log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
[Profiler thread 17876]
42.749 s compile [32 x 1.336 s]
41.759 s 97.68% compile_to_executable [2 x 20.880 s]
37.938 s 90.85% compile_to_offloads [2 x 18.969 s]
0.001 s 0.00% frontend_type_check [2 x 562.000 us]
2.727 s 7.19% lower_ast [2 x 1.363 s]
2.392 s 87.72% replace_all_usages_with [24557 x 97.400 us]
0.335 s 12.28% [unaccounted]
0.004 s 0.01% lower_matrix_ptr [2 x 1.765 ms]
0.017 s 0.04% type_check [2 x 8.416 ms]
0.126 s 0.33% verify [14 x 9.011 ms]
34.743 s 91.58% full_simplify [6 x 5.791 s]
0.082 s 0.24% extract_constant [21 x 3.912 ms]
0.004 s 0.01% unreachable_code_elimination [21 x 203.619 us]
0.011 s 0.03% binary_op_simplify [21 x 511.952 us]
1.755 ms 16.32% replace_all_usages_with [44 x 39.886 us]
8.996 ms 83.68% [unaccounted]
0.492 s 1.42% constant_fold [21 x 23.425 ms]
317.903 ms 64.62% replace_all_usages_with [1563 x 203.393 us]
12.091 ms 2.46% compile [6 x 2.015 ms]
0.792 ms 6.55% compile_to_executable [6 x 132.000 us]
405.000 us 51.14% compile_to_offloads [6 x 67.500 us]
9.000 us 2.22% frontend_type_check [6 x 1.500 us]
18.000 us 4.44% lower_ast [6 x 3.000 us]
14.000 us 3.46% lower_matrix_ptr [6 x 2.333 us]
20.000 us 4.94% type_check [6 x 3.333 us]
37.000 us 9.14% verify [12 x 3.083 us]
14.000 us 3.46% demote_operations [6 x 2.333 us]
272.000 us 67.16% offload [6 x 45.333 us]
27.000 us 9.93% type_check [12 x 2.250 us]
245.000 us 90.07% [unaccounted]
21.000 us 5.19% [unaccounted]
383.000 us 48.36% offload_to_executable [6 x 63.833 us]
114.000 us 29.77% verify [54 x 2.111 us]
44.000 us 11.49% demote_atomics [12 x 3.667 us]
24.000 us 54.55% type_check [12 x 2.000 us]
20.000 us 45.45% [unaccounted]
13.000 us 3.39% cache_loop_invariant_global_vars [6 x 2.167 us]
39.000 us 10.18% type_check [18 x 2.167 us]
10.000 us 2.61% remove_range_assumption [6 x 1.667 us]
7.000 us 1.83% remove_loop_unique [6 x 1.167 us]
60.000 us 15.67% full_simplify [12 x 5.000 us]
28.000 us 46.67% simplify [12 x 2.333 us]
29.000 us 48.33% die [12 x 2.417 us]
3.000 us 5.00% [unaccounted]
12.000 us 3.13% die [6 x 2.000 us]
5.000 us 1.31% flag_access [6 x 833.330 ns]
9.000 us 2.35% demote_operations [6 x 1.500 us]
70.000 us 18.28% [unaccounted]
4.000 us 0.51% [unaccounted]
11.299 ms 93.45% [unaccounted]
161.932 ms 32.92% [unaccounted]
0.265 s 0.76% die [63 x 4.209 ms]
0.138 s 0.40% alg_simp [21 x 6.569 ms]
100.724 ms 73.01% replace_all_usages_with [574 x 175.477 us]
37.234 ms 26.99% [unaccounted]
0.036 s 0.10% loop_invariant_code_motion [21 x 1.724 ms]
24.222 ms 66.90% replace_all_usages_with [142 x 170.577 us]
11.983 ms 33.10% [unaccounted]
0.024 s 0.07% simplify [21 x 1.163 ms]
0.411 ms 1.68% replace_all_usages_with [7 x 58.714 us]
24.003 ms 98.32% [unaccounted]
4.845 s 13.94% whole_kernel_cse [21 x 230.691 ms]
1.006 s 20.76% replace_all_usages_with [5506 x 182.657 us]
3.839 s 79.24% [unaccounted]
28.846 s 83.03% cfg_optimization [15 x 1.923 s]
27.306 s 94.66% store_to_load_forwarding [25 x 1.092 s]
19.773 s 72.41% reaching_definition_analysis [25 x 790.900 ms]
2.355 s 8.62% replace_all_usages_with [14494 x 162.458 us]
5.179 s 18.97% [unaccounted]
1.107 s 3.84% dead_store_elimination [25 x 44.262 ms]
0.924 s 83.48% live_variable_analysis [25 x 36.950 ms]
0.008 s 0.72% replace_all_usages_with [62 x 128.435 us]
0.175 s 15.80% [unaccounted]
0.230 s 0.80% die [15 x 15.317 ms]
0.204 s 0.71% [unaccounted]
0.000 s 0.00% flag_access [4 x 65.750 us]
0.019 s 0.05% offload [2 x 9.590 ms]
0.124 ms 0.65% replace_all_usages_with [2 x 62.000 us]
2.419 ms 12.61% type_check [4 x 604.750 us]
16.637 ms 86.74% [unaccounted]
0.301 s 0.79% cfg_optimization [2 x 150.676 ms]
244.540 ms 81.15% store_to_load_forwarding [2 x 122.270 ms]
210.715 ms 86.17% reaching_definition_analysis [2 x 105.357 ms]
33.825 ms 13.83% [unaccounted]
39.968 ms 13.26% dead_store_elimination [2 x 19.984 ms]
36.305 ms 90.84% live_variable_analysis [2 x 18.153 ms]
3.663 ms 9.16% [unaccounted]
6.865 ms 2.28% die [2 x 3.432 ms]
9.980 ms 3.31% [unaccounted]
3.821 s 9.15% offload_to_executable [2 x 1.911 s]
0.120 s 3.15% verify [18 x 6.678 ms]
0.009 s 0.23% demote_atomics [4 x 2.238 ms]
2.030 ms 22.68% replace_all_usages_with [122 x 16.639 us]
2.292 ms 25.61% type_check [4 x 573.000 us]
4.629 ms 51.71% [unaccounted]
0.001 s 0.03% cache_loop_invariant_global_vars [2 x 585.000 us]
0.000 s 0.01% replace_all_usages_with [4 x 61.500 us]
0.004 s 0.10% type_check [6 x 638.333 us]
0.000 s 0.01% remove_range_assumption [2 x 133.000 us]
0.000 s 0.01% remove_loop_unique [2 x 127.000 us]
3.669 s 96.01% full_simplify [4 x 917.203 ms]
0.004 s 0.11% extract_constant [15 x 274.467 us]
0.001 s 0.04% unreachable_code_elimination [15 x 96.467 us]
0.004 s 0.11% binary_op_simplify [15 x 269.133 us]
0.024 ms 0.59% replace_all_usages_with [3 x 8.000 us]
4.013 ms 99.41% [unaccounted]
0.024 s 0.64% constant_fold [15 x 1.573 ms]
8.243 ms 34.93% compile [4 x 2.061 ms]
0.534 ms 6.48% compile_to_executable [4 x 133.500 us]
262.000 us 49.06% compile_to_offloads [4 x 65.500 us]
5.000 us 1.91% frontend_type_check [4 x 1.250 us]
10.000 us 3.82% lower_ast [4 x 2.500 us]
8.000 us 3.05% lower_matrix_ptr [4 x 2.000 us]
13.000 us 4.96% type_check [4 x 3.250 us]
27.000 us 10.31% verify [8 x 3.375 us]
6.000 us 2.29% demote_operations [4 x 1.500 us]
174.000 us 66.41% offload [4 x 43.500 us]
19.000 us 10.92% type_check [8 x 2.375 us]
155.000 us 89.08% [unaccounted]
19.000 us 7.25% [unaccounted]
267.000 us 50.00% offload_to_executable [4 x 66.750 us]
84.000 us 31.46% verify [36 x 2.333 us]
30.000 us 11.24% demote_atomics [8 x 3.750 us]
16.000 us 53.33% type_check [8 x 2.000 us]
14.000 us 46.67% [unaccounted]
10.000 us 3.75% cache_loop_invariant_global_vars [4 x 2.500 us]
27.000 us 10.11% type_check [12 x 2.250 us]
6.000 us 2.25% remove_range_assumption [4 x 1.500 us]
7.000 us 2.62% remove_loop_unique [4 x 1.750 us]
40.000 us 14.98% full_simplify [8 x 5.000 us]
16.000 us 40.00% simplify [8 x 2.000 us]
19.000 us 47.50% die [8 x 2.375 us]
5.000 us 12.50% [unaccounted]
8.000 us 3.00% die [4 x 2.000 us]
3.000 us 1.12% flag_access [4 x 749.998 ns]
5.000 us 1.87% demote_operations [4 x 1.250 us]
47.000 us 17.60% [unaccounted]
5.000 us 0.94% [unaccounted]
7.709 ms 93.52% [unaccounted]
2.502 ms 10.60% replace_all_usages_with [35 x 71.486 us]
12.857 ms 54.47% [unaccounted]
0.085 s 2.32% die [45 x 1.894 ms]
0.017 s 0.45% alg_simp [15 x 1.106 ms]
3.268 ms 19.70% replace_all_usages_with [85 x 38.447 us]
13.317 ms 80.30% [unaccounted]
0.002 s 0.05% loop_invariant_code_motion [15 x 125.200 us]
0.404 s 11.02% simplify [15 x 26.947 ms]
37.147 ms 9.19% replace_all_usages_with [578 x 64.268 us]
335.076 ms 82.90% type_check [578 x 579.716 us]
31.979 ms 7.91% [unaccounted]
1.437 s 39.16% whole_kernel_cse [15 x 95.781 ms]
0.300 s 20.87% replace_all_usages_with [3806 x 78.767 us]
1.137 s 79.13% [unaccounted]
1.691 s 46.09% cfg_optimization [11 x 153.722 ms]
1.460 s 86.33% store_to_load_forwarding [13 x 112.293 ms]
1.228 s 84.14% reaching_definition_analysis [13 x 94.483 ms]
0.002 s 0.16% replace_all_usages_with [89 x 27.056 us]
0.229 s 15.70% [unaccounted]
0.174 s 10.31% dead_store_elimination [13 x 13.410 ms]
155.336 ms 89.10% live_variable_analysis [13 x 11.949 ms]
19.000 ms 10.90% [unaccounted]
0.020 s 1.17% die [11 x 1.792 ms]
0.037 s 2.19% [unaccounted]
0.009 s 0.23% die [2 x 4.355 ms]
0.000 s 0.00% flag_access [2 x 78.000 us]
0.003 s 0.07% demote_operations [2 x 1.283 ms]
0.321 ms 12.51% replace_all_usages_with [5 x 64.200 us]
1.288 ms 50.19% type_check [2 x 644.000 us]
0.957 ms 37.30% [unaccounted]
0.990 s 2.32% [unaccounted]
>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>