| /* |
| * Copyright (C) 2011 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "profiler.h" |
| |
| #include <fstream> |
| #include <sys/uio.h> |
| #include <sys/file.h> |
| |
| #include "base/stl_util.h" |
| #include "base/unix_file/fd_file.h" |
| #include "class_linker.h" |
| #include "common_throws.h" |
| #include "debugger.h" |
| #include "dex_file-inl.h" |
| #include "instrumentation.h" |
| #include "mirror/art_method-inl.h" |
| #include "mirror/class-inl.h" |
| #include "mirror/dex_cache.h" |
| #include "mirror/object_array-inl.h" |
| #include "mirror/object-inl.h" |
| #include "object_utils.h" |
| #include "os.h" |
| #include "scoped_thread_state_change.h" |
| #include "ScopedLocalRef.h" |
| #include "thread.h" |
| #include "thread_list.h" |
| |
| #ifdef HAVE_ANDROID_OS |
| #include "cutils/properties.h" |
| #endif |
| |
| #if !defined(ART_USE_PORTABLE_COMPILER) |
| #include "entrypoints/quick/quick_entrypoints.h" |
| #endif |
| |
| namespace art { |
| |
| BackgroundMethodSamplingProfiler* BackgroundMethodSamplingProfiler::profiler_ = nullptr; |
| pthread_t BackgroundMethodSamplingProfiler::profiler_pthread_ = 0U; |
| volatile bool BackgroundMethodSamplingProfiler::shutting_down_ = false; |
| |
| |
| // TODO: this profiler runs regardless of the state of the machine. Maybe we should use the |
| // wakelock or something to modify the run characteristics. This can be done when we |
| // have some performance data after it's been used for a while. |
| |
| |
| // This is called from either a thread list traversal or from a checkpoint. Regardless |
| // of which caller, the mutator lock must be held. |
| static void GetSample(Thread* thread, void* arg) SHARED_LOCKS_REQUIRED(Locks::mutator_lock_) { |
| BackgroundMethodSamplingProfiler* profiler = |
| reinterpret_cast<BackgroundMethodSamplingProfiler*>(arg); |
| mirror::ArtMethod* method = thread->GetCurrentMethod(nullptr); |
| if (false && method == nullptr) { |
| LOG(INFO) << "No current method available"; |
| std::ostringstream os; |
| thread->Dump(os); |
| std::string data(os.str()); |
| LOG(INFO) << data; |
| } |
| profiler->RecordMethod(method); |
| } |
| |
| |
| |
| // A closure that is called by the thread checkpoint code. |
| class SampleCheckpoint : public Closure { |
| public: |
| explicit SampleCheckpoint(BackgroundMethodSamplingProfiler* const profiler) : |
| profiler_(profiler) {} |
| |
| virtual void Run(Thread* thread) NO_THREAD_SAFETY_ANALYSIS { |
| Thread* self = Thread::Current(); |
| if (thread == nullptr) { |
| LOG(ERROR) << "Checkpoint with nullptr thread"; |
| return; |
| } |
| |
| // Grab the mutator lock (shared access). |
| ScopedObjectAccess soa(self); |
| |
| // Grab a sample. |
| GetSample(thread, this->profiler_); |
| |
| // And finally tell the barrier that we're done. |
| this->profiler_->GetBarrier().Pass(self); |
| } |
| |
| private: |
| BackgroundMethodSamplingProfiler* const profiler_; |
| }; |
| |
| bool BackgroundMethodSamplingProfiler::ShuttingDown(Thread* self) { |
| MutexLock mu(self, *Locks::profiler_lock_); |
| return shutting_down_; |
| } |
| |
| void* BackgroundMethodSamplingProfiler::RunProfilerThread(void* arg) { |
| Runtime* runtime = Runtime::Current(); |
| BackgroundMethodSamplingProfiler* profiler = |
| reinterpret_cast<BackgroundMethodSamplingProfiler*>(arg); |
| |
| // Add a random delay for the first time run so that we don't hammer the CPU |
| // with all profiles running at the same time. |
| const int kRandomDelayMaxSecs = 30; |
| const double kMaxBackoffSecs = 24*60*60; // Max backoff time. |
| |
| srand(MicroTime() * getpid()); |
| int startup_delay = rand() % kRandomDelayMaxSecs; // random delay for startup. |
| |
| |
| CHECK(runtime->AttachCurrentThread("Profiler", true, runtime->GetSystemThreadGroup(), |
| !runtime->IsCompiler())); |
| |
| Thread* self = Thread::Current(); |
| |
| while (true) { |
| if (ShuttingDown(self)) { |
| break; |
| } |
| |
| { |
| // wait until we need to run another profile |
| uint64_t delay_secs = profiler->period_s_ * profiler->backoff_factor_; |
| |
| // Add a startup delay to prevent all the profiles running at once. |
| delay_secs += startup_delay; |
| |
| // Immediate startup for benchmarking? |
| if (profiler->start_immediately_ && startup_delay > 0) { |
| delay_secs = 0; |
| } |
| |
| startup_delay = 0; |
| |
| VLOG(profiler) << "Delaying profile start for " << delay_secs << " secs"; |
| MutexLock mu(self, profiler->wait_lock_); |
| profiler->period_condition_.TimedWait(self, delay_secs * 1000, 0); |
| |
| // Expand the backoff by its coefficient, but don't go beyond the max. |
| double new_backoff = profiler->backoff_factor_ * profiler->backoff_coefficient_; |
| if (new_backoff < kMaxBackoffSecs) { |
| profiler->backoff_factor_ = new_backoff; |
| } |
| } |
| |
| if (ShuttingDown(self)) { |
| break; |
| } |
| |
| |
| uint64_t start_us = MicroTime(); |
| uint64_t end_us = start_us + profiler->duration_s_ * UINT64_C(1000000); |
| uint64_t now_us = start_us; |
| |
| VLOG(profiler) << "Starting profiling run now for " << PrettyDuration((end_us - start_us) * 1000); |
| |
| |
| SampleCheckpoint check_point(profiler); |
| |
| size_t valid_samples = 0; |
| while (now_us < end_us) { |
| if (ShuttingDown(self)) { |
| break; |
| } |
| |
| usleep(profiler->interval_us_); // Non-interruptible sleep. |
| |
| ThreadList* thread_list = runtime->GetThreadList(); |
| |
| profiler->profiler_barrier_->Init(self, 0); |
| size_t barrier_count = thread_list->RunCheckpointOnRunnableThreads(&check_point); |
| |
| // All threads are suspended, nothing to do. |
| if (barrier_count == 0) { |
| now_us = MicroTime(); |
| continue; |
| } |
| |
| valid_samples += barrier_count; |
| |
| ThreadState old_state = self->SetState(kWaitingForCheckPointsToRun); |
| |
| // Wait for the barrier to be crossed by all runnable threads. This wait |
| // is done with a timeout so that we can detect problems with the checkpoint |
| // running code. We should never see this. |
| const uint32_t kWaitTimeoutMs = 10000; |
| const uint32_t kWaitTimeoutUs = kWaitTimeoutMs * 1000; |
| |
| uint64_t waitstart_us = MicroTime(); |
| // Wait for all threads to pass the barrier. |
| profiler->profiler_barrier_->Increment(self, barrier_count, kWaitTimeoutMs); |
| uint64_t waitend_us = MicroTime(); |
| uint64_t waitdiff_us = waitend_us - waitstart_us; |
| |
| // We should never get a timeout. If we do, it suggests a problem with the checkpoint |
| // code. Crash the process in this case. |
| CHECK_LT(waitdiff_us, kWaitTimeoutUs); |
| |
| self->SetState(old_state); |
| |
| // Update the current time. |
| now_us = MicroTime(); |
| } |
| |
| if (valid_samples > 0 && !ShuttingDown(self)) { |
| // After the profile has been taken, write it out. |
| ScopedObjectAccess soa(self); // Acquire the mutator lock. |
| uint32_t size = profiler->WriteProfile(); |
| VLOG(profiler) << "Profile size: " << size; |
| } |
| } |
| |
| LOG(INFO) << "Profiler shutdown"; |
| runtime->DetachCurrentThread(); |
| return nullptr; |
| } |
| |
| // Write out the profile file if we are generating a profile. |
| uint32_t BackgroundMethodSamplingProfiler::WriteProfile() { |
| std::string full_name = profile_file_name_; |
| VLOG(profiler) << "Saving profile to " << full_name; |
| |
| int fd = open(full_name.c_str(), O_RDWR); |
| if (fd < 0) { |
| // Open failed. |
| LOG(ERROR) << "Failed to open profile file " << full_name; |
| return 0; |
| } |
| |
| // Lock the file for exclusive access. This will block if another process is using |
| // the file. |
| int err = flock(fd, LOCK_EX); |
| if (err < 0) { |
| LOG(ERROR) << "Failed to lock profile file " << full_name; |
| return 0; |
| } |
| |
| // Read the previous profile. |
| profile_table_.ReadPrevious(fd); |
| |
| // Move back to the start of the file. |
| lseek(fd, 0, SEEK_SET); |
| |
| // Format the profile output and write to the file. |
| std::ostringstream os; |
| uint32_t num_methods = DumpProfile(os); |
| std::string data(os.str()); |
| const char *p = data.c_str(); |
| size_t length = data.length(); |
| size_t full_length = length; |
| do { |
| int n = ::write(fd, p, length); |
| p += n; |
| length -= n; |
| } while (length > 0); |
| |
| // Truncate the file to the new length. |
| ftruncate(fd, full_length); |
| |
| // Now unlock the file, allowing another process in. |
| err = flock(fd, LOCK_UN); |
| if (err < 0) { |
| LOG(ERROR) << "Failed to unlock profile file " << full_name; |
| } |
| |
| // Done, close the file. |
| ::close(fd); |
| |
| // Clean the profile for the next time. |
| CleanProfile(); |
| |
| return num_methods; |
| } |
| |
| // Start a profile thread with the user-supplied arguments. |
| void BackgroundMethodSamplingProfiler::Start(int period, int duration, |
| const std::string& profile_file_name, const std::string& procName, |
| int interval_us, |
| double backoff_coefficient, bool startImmediately) { |
| Thread* self = Thread::Current(); |
| { |
| MutexLock mu(self, *Locks::profiler_lock_); |
| // Don't start two profiler threads. |
| if (profiler_ != nullptr) { |
| return; |
| } |
| } |
| |
| // Only on target... |
| #ifdef HAVE_ANDROID_OS |
| // Switch off profiler if the dalvik.vm.profiler property has value 0. |
| char buf[PROP_VALUE_MAX]; |
| property_get("dalvik.vm.profiler", buf, "0"); |
| if (strcmp(buf, "0") == 0) { |
| LOG(INFO) << "Profiler disabled. To enable setprop dalvik.vm.profiler 1"; |
| return; |
| } |
| #endif |
| |
| LOG(INFO) << "Starting profile with period " << period << "s, duration " << duration << |
| "s, interval " << interval_us << "us. Profile file " << profile_file_name; |
| |
| { |
| MutexLock mu(self, *Locks::profiler_lock_); |
| profiler_ = new BackgroundMethodSamplingProfiler(period, duration, profile_file_name, |
| procName, |
| backoff_coefficient, |
| interval_us, startImmediately); |
| |
| CHECK_PTHREAD_CALL(pthread_create, (&profiler_pthread_, nullptr, &RunProfilerThread, |
| reinterpret_cast<void*>(profiler_)), |
| "Profiler thread"); |
| } |
| } |
| |
| |
| |
| void BackgroundMethodSamplingProfiler::Stop() { |
| BackgroundMethodSamplingProfiler* profiler = nullptr; |
| pthread_t profiler_pthread = 0U; |
| { |
| MutexLock trace_mu(Thread::Current(), *Locks::profiler_lock_); |
| profiler = profiler_; |
| shutting_down_ = true; |
| profiler_pthread = profiler_pthread_; |
| } |
| |
| // Now wake up the sampler thread if it sleeping. |
| { |
| MutexLock profile_mu(Thread::Current(), profiler->wait_lock_); |
| profiler->period_condition_.Signal(Thread::Current()); |
| } |
| // Wait for the sample thread to stop. |
| CHECK_PTHREAD_CALL(pthread_join, (profiler_pthread, nullptr), "profiler thread shutdown"); |
| |
| { |
| MutexLock mu(Thread::Current(), *Locks::profiler_lock_); |
| profiler_ = nullptr; |
| } |
| delete profiler; |
| } |
| |
| |
| void BackgroundMethodSamplingProfiler::Shutdown() { |
| Stop(); |
| } |
| |
| BackgroundMethodSamplingProfiler::BackgroundMethodSamplingProfiler(int period, int duration, |
| const std::string& profile_file_name, |
| const std::string& process_name, |
| double backoff_coefficient, int interval_us, bool startImmediately) |
| : profile_file_name_(profile_file_name), process_name_(process_name), |
| period_s_(period), start_immediately_(startImmediately), |
| interval_us_(interval_us), backoff_factor_(1.0), |
| backoff_coefficient_(backoff_coefficient), duration_s_(duration), |
| wait_lock_("Profile wait lock"), |
| period_condition_("Profile condition", wait_lock_), |
| profile_table_(wait_lock_), |
| profiler_barrier_(new Barrier(0)) { |
| // Populate the filtered_methods set. |
| // This is empty right now, but to add a method, do this: |
| // |
| // filtered_methods_.insert("void java.lang.Object.wait(long, int)"); |
| } |
| |
| // A method has been hit, record its invocation in the method map. |
| // The mutator_lock must be held (shared) when this is called. |
| void BackgroundMethodSamplingProfiler::RecordMethod(mirror::ArtMethod* method) { |
| if (method == nullptr) { |
| profile_table_.NullMethod(); |
| // Don't record a nullptr method. |
| return; |
| } |
| |
| mirror::Class* cls = method->GetDeclaringClass(); |
| if (cls != nullptr) { |
| if (cls->GetClassLoader() == nullptr) { |
| // Don't include things in the boot |
| profile_table_.BootMethod(); |
| return; |
| } |
| } |
| |
| bool is_filtered = false; |
| |
| MethodHelper mh(method); |
| if (strcmp(mh.GetName(), "<clinit>") == 0) { |
| // always filter out class init |
| is_filtered = true; |
| } |
| |
| // Filter out methods by name if there are any. |
| if (!is_filtered && filtered_methods_.size() > 0) { |
| std::string method_full_name = PrettyMethod(method); |
| |
| // Don't include specific filtered methods. |
| is_filtered = filtered_methods_.count(method_full_name) != 0; |
| } |
| |
| // Add to the profile table unless it is filtered out. |
| if (!is_filtered) { |
| profile_table_.Put(method); |
| } |
| } |
| |
| // Clean out any recordings for the method traces. |
| void BackgroundMethodSamplingProfiler::CleanProfile() { |
| profile_table_.Clear(); |
| } |
| |
| uint32_t BackgroundMethodSamplingProfiler::DumpProfile(std::ostream& os) { |
| return profile_table_.Write(os); |
| } |
| |
| // Profile Table. |
| // This holds a mapping of mirror::ArtMethod* to a count of how many times a sample |
| // hit it at the top of the stack. |
| ProfileSampleResults::ProfileSampleResults(Mutex& lock) : lock_(lock), num_samples_(0), |
| num_null_methods_(0), |
| num_boot_methods_(0) { |
| for (int i = 0; i < kHashSize; i++) { |
| table[i] = nullptr; |
| } |
| } |
| |
| ProfileSampleResults::~ProfileSampleResults() { |
| for (int i = 0; i < kHashSize; i++) { |
| delete table[i]; |
| } |
| } |
| |
| // Add a method to the profile table. If it the first time the method |
| // has been seen, add it with count=1, otherwise increment the count. |
| void ProfileSampleResults::Put(mirror::ArtMethod* method) { |
| lock_.Lock(Thread::Current()); |
| uint32_t index = Hash(method); |
| if (table[index] == nullptr) { |
| table[index] = new Map(); |
| } |
| Map::iterator i = table[index]->find(method); |
| if (i == table[index]->end()) { |
| (*table[index])[method] = 1; |
| } else { |
| i->second++; |
| } |
| num_samples_++; |
| lock_.Unlock(Thread::Current()); |
| } |
| |
| // Write the profile table to the output stream. Also merge with the previous profile. |
| uint32_t ProfileSampleResults::Write(std::ostream &os) { |
| ScopedObjectAccess soa(Thread::Current()); |
| num_samples_ += previous_num_samples_; |
| num_null_methods_ += previous_num_null_methods_; |
| num_boot_methods_ += previous_num_boot_methods_; |
| |
| VLOG(profiler) << "Profile: " << num_samples_ << "/" << num_null_methods_ << "/" << num_boot_methods_; |
| os << num_samples_ << "/" << num_null_methods_ << "/" << num_boot_methods_ << "\n"; |
| uint32_t num_methods = 0; |
| for (int i = 0 ; i < kHashSize; i++) { |
| Map *map = table[i]; |
| if (map != nullptr) { |
| for (const auto &meth_iter : *map) { |
| mirror::ArtMethod *method = meth_iter.first; |
| std::string method_name = PrettyMethod(method); |
| |
| MethodHelper mh(method); |
| const DexFile::CodeItem* codeitem = mh.GetCodeItem(); |
| uint32_t method_size = 0; |
| if (codeitem != nullptr) { |
| method_size = codeitem->insns_size_in_code_units_; |
| } |
| uint32_t count = meth_iter.second; |
| |
| // Merge this profile entry with one from a previous run (if present). Also |
| // remove the previous entry. |
| PreviousProfile::iterator pi = previous_.find(method_name); |
| if (pi != previous_.end()) { |
| count += pi->second.count_; |
| previous_.erase(pi); |
| } |
| os << StringPrintf("%s/%u/%u\n", method_name.c_str(), count, method_size); |
| ++num_methods; |
| } |
| } |
| } |
| |
| // Now we write out the remaining previous methods. |
| for (PreviousProfile::iterator pi = previous_.begin(); pi != previous_.end(); ++pi) { |
| os << StringPrintf("%s/%u/%u\n", pi->first.c_str(), pi->second.count_, pi->second.method_size_); |
| ++num_methods; |
| } |
| return num_methods; |
| } |
| |
| void ProfileSampleResults::Clear() { |
| num_samples_ = 0; |
| num_null_methods_ = 0; |
| num_boot_methods_ = 0; |
| for (int i = 0; i < kHashSize; i++) { |
| delete table[i]; |
| table[i] = nullptr; |
| } |
| previous_.clear(); |
| } |
| |
| uint32_t ProfileSampleResults::Hash(mirror::ArtMethod* method) { |
| return (PointerToLowMemUInt32(method) >> 3) % kHashSize; |
| } |
| |
// Read a single line into the given string.  Returns true if everything OK, false
// on EOF or error.
//
// fd:   descriptor to read from, positioned at the start of the line.
// line: receives the line without its terminating '\n'. It is cleared first; on a false
//       return it holds whatever was read before EOF or the error.
//
// A read interrupted by a signal (EINTR) is retried rather than reported as a failure.
static bool ReadProfileLine(int fd, std::string& line) {
  line.clear();
  while (true) {
    char ch;
    const ssize_t n = read(fd, &ch, 1);   // TODO: could speed this up but is it worth it?
    if (n < 0 && errno == EINTR) {
      continue;
    }
    if (n != 1) {
      return false;
    }
    if (ch == '\n') {
      return true;
    }
    line += ch;
  }
}
| |
| void ProfileSampleResults::ReadPrevious(int fd) { |
| // Reset counters. |
| previous_num_samples_ = previous_num_null_methods_ = previous_num_boot_methods_ = 0; |
| |
| std::string line; |
| |
| // The first line contains summary information. |
| if (!ReadProfileLine(fd, line)) { |
| return; |
| } |
| std::vector<std::string> summary_info; |
| Split(line, '/', summary_info); |
| if (summary_info.size() != 3) { |
| // Bad summary info. It should be count/nullcount/bootcount |
| return; |
| } |
| previous_num_samples_ = atoi(summary_info[0].c_str()); |
| previous_num_null_methods_ = atoi(summary_info[1].c_str()); |
| previous_num_boot_methods_ = atoi(summary_info[2].c_str()); |
| |
| // Now read each line until the end of file. Each line consists of 3 fields separated by / |
| while (true) { |
| if (!ReadProfileLine(fd, line)) { |
| break; |
| } |
| std::vector<std::string> info; |
| Split(line, '/', info); |
| if (info.size() != 3) { |
| // Malformed. |
| break; |
| } |
| std::string methodname = info[0]; |
| uint32_t count = atoi(info[1].c_str()); |
| uint32_t size = atoi(info[2].c_str()); |
| previous_[methodname] = PreviousValue(count, size); |
| } |
| } |
| |
| bool ProfileHelper::LoadProfileMap(ProfileMap& profileMap, const std::string& fileName) { |
| LOG(VERBOSE) << "reading profile file " << fileName; |
| struct stat st; |
| int err = stat(fileName.c_str(), &st); |
| if (err == -1) { |
| LOG(VERBOSE) << "not found"; |
| return false; |
| } |
| if (st.st_size == 0) { |
| return false; // Empty profiles are invalid. |
| } |
| std::ifstream in(fileName.c_str()); |
| if (!in) { |
| LOG(VERBOSE) << "profile file " << fileName << " exists but can't be opened"; |
| LOG(VERBOSE) << "file owner: " << st.st_uid << ":" << st.st_gid; |
| LOG(VERBOSE) << "me: " << getuid() << ":" << getgid(); |
| LOG(VERBOSE) << "file permissions: " << std::oct << st.st_mode; |
| LOG(VERBOSE) << "errno: " << errno; |
| return false; |
| } |
| // The first line contains summary information. |
| std::string line; |
| std::getline(in, line); |
| if (in.eof()) { |
| return false; |
| } |
| std::vector<std::string> summary_info; |
| Split(line, '/', summary_info); |
| if (summary_info.size() != 3) { |
| // Bad summary info. It should be count/total/bootpath. |
| return false; |
| } |
| // This is the number of hits in all methods. |
| uint32_t total_count = 0; |
| for (int i = 0 ; i < 3; ++i) { |
| total_count += atoi(summary_info[i].c_str()); |
| } |
| |
| // Now read each line until the end of file. Each line consists of 3 fields separated by '/'. |
| // Store the info in descending order given by the most used methods. |
| typedef std::set<std::pair<int, std::vector<std::string>>> ProfileSet; |
| ProfileSet countSet; |
| while (!in.eof()) { |
| std::getline(in, line); |
| if (in.eof()) { |
| break; |
| } |
| std::vector<std::string> info; |
| Split(line, '/', info); |
| if (info.size() != 3) { |
| // Malformed. |
| break; |
| } |
| int count = atoi(info[1].c_str()); |
| countSet.insert(std::make_pair(-count, info)); |
| } |
| |
| uint32_t curTotalCount = 0; |
| ProfileSet::iterator end = countSet.end(); |
| const ProfileData* prevData = nullptr; |
| for (ProfileSet::iterator it = countSet.begin(); it != end ; it++) { |
| const std::string& methodname = it->second[0]; |
| uint32_t count = -it->first; |
| uint32_t size = atoi(it->second[2].c_str()); |
| double usedPercent = (count * 100.0) / total_count; |
| |
| curTotalCount += count; |
| // Methods with the same count should be part of the same top K percentage bucket. |
| double topKPercentage = (prevData != nullptr) && (prevData->GetCount() == count) |
| ? prevData->GetTopKUsedPercentage() |
| : 100 * static_cast<double>(curTotalCount) / static_cast<double>(total_count); |
| |
| // Add it to the profile map. |
| ProfileData curData = ProfileData(methodname, count, size, usedPercent, topKPercentage); |
| profileMap[methodname] = curData; |
| prevData = &curData; |
| } |
| return true; |
| } |
| |
| bool ProfileHelper::LoadTopKSamples(std::set<std::string>& topKSamples, const std::string& fileName, |
| double topKPercentage) { |
| ProfileMap profileMap; |
| bool loadOk = LoadProfileMap(profileMap, fileName); |
| if (!loadOk) { |
| return false; |
| } |
| ProfileMap::iterator end = profileMap.end(); |
| for (ProfileMap::iterator it = profileMap.begin(); it != end; it++) { |
| if (it->second.GetTopKUsedPercentage() < topKPercentage) { |
| topKSamples.insert(it->first); |
| } |
| } |
| return true; |
| } |
| |
| } // namespace art |