blob: 0f20a99f051fa28ed90b9e6e29be12c66eefc2cd [file] [log] [blame]
Mathieu Chartieref2fa262018-04-12 15:14:07 -07001/*
2 * Copyright (C) 2018 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17#include "dexanalyze_experiments.h"
Mathieu Chartier35ddc6f2018-05-09 11:34:07 -070018
19#include <stdint.h>
20#include <inttypes.h>
21#include <iostream>
22#include <map>
23#include <vector>
24
25#include "android-base/stringprintf.h"
Mathieu Chartierc2b4db62018-05-18 13:58:12 -070026#include "dex/class_accessor-inl.h"
Mathieu Chartier05dc23e2018-05-22 11:56:14 -070027#include "dex/class_iterator.h"
Mathieu Chartieref2fa262018-04-12 15:14:07 -070028#include "dex/code_item_accessors-inl.h"
29#include "dex/dex_instruction-inl.h"
30#include "dex/standard_dex_file.h"
Mathieu Chartierf2759792018-05-18 13:16:54 -070031#include "dex/utf-inl.h"
Mathieu Chartieref2fa262018-04-12 15:14:07 -070032
33namespace art {
34
Mathieu Chartier35ddc6f2018-05-09 11:34:07 -070035std::string Percent(uint64_t value, uint64_t max) {
36 if (max == 0) {
37 ++max;
38 }
39 return android::base::StringPrintf("%" PRId64 "(%.2f%%)",
40 value,
41 static_cast<double>(value * 100) / static_cast<double>(max));
42}
43
44static size_t PrefixLen(const std::string& a, const std::string& b) {
45 size_t len = 0;
46 for (; len < a.length() && len < b.length() && a[len] == b[len]; ++len) {}
47 return len;
48}
49
50void AnalyzeStrings::ProcessDexFile(const DexFile& dex_file) {
51 std::vector<std::string> strings;
52 for (size_t i = 0; i < dex_file.NumStringIds(); ++i) {
53 uint32_t length = 0;
Mathieu Chartierf2759792018-05-18 13:16:54 -070054 const char* data = dex_file.StringDataAndUtf16LengthByIdx(dex::StringIndex(i), &length);
55 // Analyze if the string has any UTF16 chars.
56 bool have_wide_char = false;
57 const char* ptr = data;
58 for (size_t j = 0; j < length; ++j) {
59 have_wide_char = have_wide_char || GetUtf16FromUtf8(&ptr) >= 0x100;
60 }
61 if (have_wide_char) {
62 wide_string_bytes_ += 2 * length;
63 } else {
64 ascii_string_bytes_ += length;
65 }
66 string_data_bytes_ += ptr - data;
67
Mathieu Chartier35ddc6f2018-05-09 11:34:07 -070068 strings.push_back(data);
69 }
70 // Note that the strings are probably already sorted.
71 std::sort(strings.begin(), strings.end());
72
73 // Tunable parameters.
74 static const size_t kMinPrefixLen = 3;
75 static const size_t kPrefixConstantCost = 5;
76 static const size_t kPrefixIndexCost = 2;
77
78 // Calculate total shared prefix.
79 std::vector<size_t> shared_len;
80 std::set<std::string> prefixes;
81 for (size_t i = 0; i < strings.size(); ++i) {
82 size_t best_len = 0;
83 if (i > 0) {
84 best_len = std::max(best_len, PrefixLen(strings[i], strings[i - 1]));
85 }
86 if (i < strings.size() - 1) {
87 best_len = std::max(best_len, PrefixLen(strings[i], strings[i + 1]));
88 }
89 std::string prefix;
90 if (best_len >= kMinPrefixLen) {
91 prefix = strings[i].substr(0, best_len);
92 prefixes.insert(prefix);
93 total_prefix_savings_ += prefix.length();
94 }
95 total_prefix_index_cost_ += kPrefixIndexCost;
96 }
97 total_num_prefixes_ += prefixes.size();
98 for (const std::string& s : prefixes) {
99 // 4 bytes for an offset, one for length.
100 total_prefix_dict_ += s.length();
101 total_prefix_table_ += kPrefixConstantCost;
102 }
103}
104
105void AnalyzeStrings::Dump(std::ostream& os, uint64_t total_size) const {
Mathieu Chartierf2759792018-05-18 13:16:54 -0700106 os << "Total string data bytes " << Percent(string_data_bytes_, total_size) << "\n";
107 os << "UTF-16 string data bytes " << Percent(wide_string_bytes_, total_size) << "\n";
108 os << "ASCII string data bytes " << Percent(ascii_string_bytes_, total_size) << "\n";
109
110 // Prefix based strings.
Mathieu Chartier35ddc6f2018-05-09 11:34:07 -0700111 os << "Total shared prefix bytes " << Percent(total_prefix_savings_, total_size) << "\n";
112 os << "Prefix dictionary cost " << Percent(total_prefix_dict_, total_size) << "\n";
113 os << "Prefix table cost " << Percent(total_prefix_table_, total_size) << "\n";
114 os << "Prefix index cost " << Percent(total_prefix_index_cost_, total_size) << "\n";
115 int64_t net_savings = total_prefix_savings_;
116 net_savings -= total_prefix_dict_;
117 net_savings -= total_prefix_table_;
118 net_savings -= total_prefix_index_cost_;
119 os << "Prefix net savings " << Percent(net_savings, total_size) << "\n";
120 os << "Prefix dictionary elements " << total_num_prefixes_ << "\n";
121}
122
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700123void CountDexIndices::ProcessDexFile(const DexFile& dex_file) {
124 num_string_ids_ += dex_file.NumStringIds();
125 num_method_ids_ += dex_file.NumMethodIds();
126 num_field_ids_ += dex_file.NumFieldIds();
127 num_type_ids_ += dex_file.NumTypeIds();
128 num_class_defs_ += dex_file.NumClassDefs();
Mathieu Chartier7c3a8c12018-05-23 18:09:45 -0700129 std::set<size_t> unique_code_items;
Mathieu Chartier05dc23e2018-05-22 11:56:14 -0700130 for (ClassAccessor accessor : dex_file.GetClasses()) {
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700131 std::set<size_t> unique_method_ids;
132 std::set<size_t> unique_string_ids;
Mathieu Chartier0d896bd2018-05-25 00:20:27 -0700133 for (const ClassAccessor::Method& method : accessor.GetMethods()) {
Mathieu Chartier05dc23e2018-05-22 11:56:14 -0700134 dex_code_bytes_ += method.GetInstructions().InsnsSizeInBytes();
Mathieu Chartier7c3a8c12018-05-23 18:09:45 -0700135 unique_code_items.insert(method.GetCodeItemOffset());
Mathieu Chartier05dc23e2018-05-22 11:56:14 -0700136 for (const DexInstructionPcPair& inst : method.GetInstructions()) {
Mathieu Chartierc2b4db62018-05-18 13:58:12 -0700137 switch (inst->Opcode()) {
138 case Instruction::CONST_STRING: {
139 const dex::StringIndex string_index(inst->VRegB_21c());
140 unique_string_ids.insert(string_index.index_);
141 ++num_string_ids_from_code_;
142 break;
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700143 }
Mathieu Chartierc2b4db62018-05-18 13:58:12 -0700144 case Instruction::CONST_STRING_JUMBO: {
145 const dex::StringIndex string_index(inst->VRegB_31c());
146 unique_string_ids.insert(string_index.index_);
147 ++num_string_ids_from_code_;
148 break;
149 }
150 // Invoke cases.
151 case Instruction::INVOKE_VIRTUAL:
152 case Instruction::INVOKE_VIRTUAL_RANGE: {
153 bool is_range = (inst->Opcode() == Instruction::INVOKE_VIRTUAL_RANGE);
154 uint32_t method_idx = is_range ? inst->VRegB_3rc() : inst->VRegB_35c();
Mathieu Chartierc8c8d5f2018-05-22 11:56:14 -0700155 if (dex_file.GetMethodId(method_idx).class_idx_ == accessor.GetClassIdx()) {
Mathieu Chartierc2b4db62018-05-18 13:58:12 -0700156 ++same_class_virtual_;
157 } else {
158 ++other_class_virtual_;
159 unique_method_ids.insert(method_idx);
160 }
161 break;
162 }
163 case Instruction::INVOKE_DIRECT:
164 case Instruction::INVOKE_DIRECT_RANGE: {
165 bool is_range = (inst->Opcode() == Instruction::INVOKE_DIRECT_RANGE);
166 uint32_t method_idx = (is_range) ? inst->VRegB_3rc() : inst->VRegB_35c();
Mathieu Chartierc8c8d5f2018-05-22 11:56:14 -0700167 if (dex_file.GetMethodId(method_idx).class_idx_ == accessor.GetClassIdx()) {
Mathieu Chartierc2b4db62018-05-18 13:58:12 -0700168 ++same_class_direct_;
169 } else {
170 ++other_class_direct_;
171 unique_method_ids.insert(method_idx);
172 }
173 break;
174 }
175 case Instruction::INVOKE_STATIC:
176 case Instruction::INVOKE_STATIC_RANGE: {
177 bool is_range = (inst->Opcode() == Instruction::INVOKE_STATIC_RANGE);
178 uint32_t method_idx = (is_range) ? inst->VRegB_3rc() : inst->VRegB_35c();
Mathieu Chartierc8c8d5f2018-05-22 11:56:14 -0700179 if (dex_file.GetMethodId(method_idx).class_idx_ == accessor.GetClassIdx()) {
Mathieu Chartierc2b4db62018-05-18 13:58:12 -0700180 ++same_class_static_;
181 } else {
182 ++other_class_static_;
183 unique_method_ids.insert(method_idx);
184 }
185 break;
186 }
187 default:
188 break;
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700189 }
190 }
Mathieu Chartier0d896bd2018-05-25 00:20:27 -0700191 }
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700192 total_unique_method_idx_ += unique_method_ids.size();
193 total_unique_string_ids_ += unique_string_ids.size();
194 }
Mathieu Chartier7c3a8c12018-05-23 18:09:45 -0700195 total_unique_code_items_ += unique_code_items.size();
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700196}
197
Mathieu Chartier35ddc6f2018-05-09 11:34:07 -0700198void CountDexIndices::Dump(std::ostream& os, uint64_t total_size) const {
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700199 os << "Num string ids: " << num_string_ids_ << "\n";
200 os << "Num method ids: " << num_method_ids_ << "\n";
201 os << "Num field ids: " << num_field_ids_ << "\n";
202 os << "Num type ids: " << num_type_ids_ << "\n";
203 os << "Num class defs: " << num_class_defs_ << "\n";
204 os << "Same class direct: " << same_class_direct_ << "\n";
205 os << "Other class direct: " << other_class_direct_ << "\n";
206 os << "Same class virtual: " << same_class_virtual_ << "\n";
207 os << "Other class virtual: " << other_class_virtual_ << "\n";
208 os << "Same class static: " << same_class_static_ << "\n";
209 os << "Other class static: " << other_class_static_ << "\n";
210 os << "Num strings accessed from code: " << num_string_ids_from_code_ << "\n";
211 os << "Unique(per class) method ids accessed from code: " << total_unique_method_idx_ << "\n";
212 os << "Unique(per class) string ids accessed from code: " << total_unique_string_ids_ << "\n";
213 size_t same_class_total = same_class_direct_ + same_class_virtual_ + same_class_static_;
214 size_t other_class_total = other_class_direct_ + other_class_virtual_ + other_class_static_;
215 os << "Same class invoke: " << same_class_total << "\n";
216 os << "Other class invoke: " << other_class_total << "\n";
217 os << "Invokes from code: " << (same_class_total + other_class_total) << "\n";
Mathieu Chartier7c3a8c12018-05-23 18:09:45 -0700218 os << "Total Dex code bytes: " << Percent(dex_code_bytes_, total_size) << "\n";
219 os << "Total unique code items: " << total_unique_code_items_ << "\n";
220 os << "Total Dex size: " << total_size << "\n";
Mathieu Chartieref2fa262018-04-12 15:14:07 -0700221}
222
223} // namespace art
224