blob: 22522016cca5fd9505b90b3fc94415a34259aa12 [file] [log] [blame]
Yao Chen44cf27c2017-09-14 22:32:50 -07001/*
2 * Copyright (C) 2017 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
Yao Chen44cf27c2017-09-14 22:32:50 -070017#define DEBUG true // STOPSHIP if true
Joe Onorato9fc9edf2017-10-15 20:08:52 -070018#include "Log.h"
Yao Chen44cf27c2017-09-14 22:32:50 -070019
Yang Lu3eba6212017-10-25 19:54:45 -070020#include "../anomaly/DiscreteAnomalyTracker.h"
Yao Chen729093d2017-10-16 10:33:26 -070021#include "CountMetricProducer.h"
22#include "stats_util.h"
Yao Chen44cf27c2017-09-14 22:32:50 -070023
Yao Chen44cf27c2017-09-14 22:32:50 -070024#include <limits.h>
25#include <stdlib.h>
26
yrob0378b02017-11-09 20:36:25 -080027using android::util::FIELD_COUNT_REPEATED;
yro2b0f8862017-11-06 14:27:31 -080028using android::util::FIELD_TYPE_BOOL;
29using android::util::FIELD_TYPE_FLOAT;
30using android::util::FIELD_TYPE_INT32;
31using android::util::FIELD_TYPE_INT64;
32using android::util::FIELD_TYPE_MESSAGE;
yro24809bd2017-10-31 23:06:53 -070033using android::util::ProtoOutputStream;
Yao Chen729093d2017-10-16 10:33:26 -070034using std::map;
35using std::string;
Yao Chen44cf27c2017-09-14 22:32:50 -070036using std::unordered_map;
Yao Chen729093d2017-10-16 10:33:26 -070037using std::vector;
Yao Chen44cf27c2017-09-14 22:32:50 -070038
39namespace android {
40namespace os {
41namespace statsd {
42
// Proto field numbers used when this producer serializes its report.
// At the call sites each number is OR-ed with a FIELD_TYPE_* flag (and, for
// repeated fields, FIELD_COUNT_REPEATED) before being handed to ProtoOutputStream.

// Fields of StatsLogReport.
const int FIELD_ID_METRIC_ID = 1;
const int FIELD_ID_START_REPORT_NANOS = 2;
const int FIELD_ID_END_REPORT_NANOS = 3;
const int FIELD_ID_COUNT_METRICS = 5;

// Fields of CountMetricDataWrapper.
const int FIELD_ID_DATA = 1;

// Fields of CountMetricData.
const int FIELD_ID_DIMENSION = 1;
const int FIELD_ID_BUCKET_INFO = 2;

// Fields of KeyValuePair.
const int FIELD_ID_KEY = 1;
const int FIELD_ID_VALUE_STR = 2;
const int FIELD_ID_VALUE_INT = 3;
const int FIELD_ID_VALUE_BOOL = 4;
const int FIELD_ID_VALUE_FLOAT = 5;

// Fields of CountBucketInfo.
const int FIELD_ID_START_BUCKET_NANOS = 1;
const int FIELD_ID_END_BUCKET_NANOS = 2;
const int FIELD_ID_COUNT = 3;
63
Yao Chen729093d2017-10-16 10:33:26 -070064// TODO: add back AnomalyTracker.
Yang Lu3eba6212017-10-25 19:54:45 -070065
Yao Chen729093d2017-10-16 10:33:26 -070066CountMetricProducer::CountMetricProducer(const CountMetric& metric, const int conditionIndex,
Yao Chen93fe3a32017-11-02 13:52:59 -070067 const sp<ConditionWizard>& wizard,
68 const uint64_t startTimeNs)
69 : MetricProducer(startTimeNs, conditionIndex, wizard), mMetric(metric) {
Yao Chen44cf27c2017-09-14 22:32:50 -070070 // TODO: evaluate initial conditions. and set mConditionMet.
71 if (metric.has_bucket() && metric.bucket().has_bucket_size_millis()) {
Yao Chen729093d2017-10-16 10:33:26 -070072 mBucketSizeNs = metric.bucket().bucket_size_millis() * 1000 * 1000;
Yao Chen44cf27c2017-09-14 22:32:50 -070073 } else {
Yao Chen729093d2017-10-16 10:33:26 -070074 mBucketSizeNs = LLONG_MAX;
Yao Chen44cf27c2017-09-14 22:32:50 -070075 }
76
Bookatzd3606c72017-10-19 10:13:49 -070077 mAnomalyTrackers.reserve(metric.alerts_size());
78 for (int i = 0; i < metric.alerts_size(); i++) {
79 const Alert& alert = metric.alerts(i);
80 if (alert.trigger_if_sum_gt() > 0 && alert.number_of_buckets() > 0) {
Yang Lu3eba6212017-10-25 19:54:45 -070081 mAnomalyTrackers.push_back(std::make_unique<DiscreteAnomalyTracker>(alert));
Bookatzd3606c72017-10-19 10:13:49 -070082 } else {
83 ALOGW("Ignoring invalid count metric alert: threshold=%lld num_buckets= %d",
84 alert.trigger_if_sum_gt(), alert.number_of_buckets());
85 }
86 }
87
Yao Chen729093d2017-10-16 10:33:26 -070088 // TODO: use UidMap if uid->pkg_name is required
89 mDimension.insert(mDimension.begin(), metric.dimension().begin(), metric.dimension().end());
90
91 if (metric.links().size() > 0) {
92 mConditionLinks.insert(mConditionLinks.begin(), metric.links().begin(),
93 metric.links().end());
94 mConditionSliced = true;
95 }
96
yro24809bd2017-10-31 23:06:53 -070097 startNewProtoOutputStream(mStartTimeNs);
98
Yao Chen729093d2017-10-16 10:33:26 -070099 VLOG("metric %lld created. bucket size %lld start_time: %lld", metric.metric_id(),
100 (long long)mBucketSizeNs, (long long)mStartTimeNs);
Yao Chen44cf27c2017-09-14 22:32:50 -0700101}
102
Yao Chen44cf27c2017-09-14 22:32:50 -0700103CountMetricProducer::~CountMetricProducer() {
104 VLOG("~CountMetricProducer() called");
105}
106
yro24809bd2017-10-31 23:06:53 -0700107void CountMetricProducer::startNewProtoOutputStream(long long startTime) {
108 mProto = std::make_unique<ProtoOutputStream>();
109 mProto->write(FIELD_TYPE_INT32 | FIELD_ID_METRIC_ID, mMetric.metric_id());
110 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_START_REPORT_NANOS, startTime);
111 mProtoToken = mProto->start(FIELD_TYPE_MESSAGE | FIELD_ID_COUNT_METRICS);
Yao Chen44cf27c2017-09-14 22:32:50 -0700112}
113
yro24809bd2017-10-31 23:06:53 -0700114void CountMetricProducer::finish() {
Yao Chen729093d2017-10-16 10:33:26 -0700115}
116
Yao Chen5154a372017-10-30 22:57:06 -0700117void CountMetricProducer::onSlicedConditionMayChange(const uint64_t eventTime) {
Yao Chen729093d2017-10-16 10:33:26 -0700118 VLOG("Metric %lld onSlicedConditionMayChange", mMetric.metric_id());
119}
120
yro17adac92017-11-08 23:16:29 -0800121std::unique_ptr<std::vector<uint8_t>> CountMetricProducer::onDumpReport() {
Yao Chen93fe3a32017-11-02 13:52:59 -0700122 long long endTime = time(nullptr) * NS_PER_SEC;
Yao Chen729093d2017-10-16 10:33:26 -0700123
124 // Dump current bucket if it's stale.
125 // If current bucket is still on-going, don't force dump current bucket.
126 // In finish(), We can force dump current bucket.
yro24809bd2017-10-31 23:06:53 -0700127 flushCounterIfNeeded(endTime);
Yao Chen93fe3a32017-11-02 13:52:59 -0700128 VLOG("metric %lld dump report now...", mMetric.metric_id());
Yao Chen729093d2017-10-16 10:33:26 -0700129
Yao Chen93fe3a32017-11-02 13:52:59 -0700130 for (const auto& counter : mPastBuckets) {
yro24809bd2017-10-31 23:06:53 -0700131 const HashableDimensionKey& hashableKey = counter.first;
Yao Chen93fe3a32017-11-02 13:52:59 -0700132 VLOG(" dimension key %s", hashableKey.c_str());
Yao Chen729093d2017-10-16 10:33:26 -0700133 auto it = mDimensionKeyMap.find(hashableKey);
134 if (it == mDimensionKeyMap.end()) {
135 ALOGE("Dimension key %s not found?!?! skip...", hashableKey.c_str());
136 continue;
137 }
yrob0378b02017-11-09 20:36:25 -0800138 long long wrapperToken =
139 mProto->start(FIELD_TYPE_MESSAGE | FIELD_COUNT_REPEATED | FIELD_ID_DATA);
Yao Chen729093d2017-10-16 10:33:26 -0700140
yro24809bd2017-10-31 23:06:53 -0700141 // First fill dimension (KeyValuePairs).
142 for (const auto& kv : it->second) {
yrob0378b02017-11-09 20:36:25 -0800143 long long dimensionToken =
144 mProto->start(FIELD_TYPE_MESSAGE | FIELD_COUNT_REPEATED | FIELD_ID_DIMENSION);
yro24809bd2017-10-31 23:06:53 -0700145 mProto->write(FIELD_TYPE_INT32 | FIELD_ID_KEY, kv.key());
146 if (kv.has_value_str()) {
147 mProto->write(FIELD_TYPE_INT32 | FIELD_ID_VALUE_STR, kv.value_str());
148 } else if (kv.has_value_int()) {
149 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_VALUE_INT, kv.value_int());
150 } else if (kv.has_value_bool()) {
151 mProto->write(FIELD_TYPE_BOOL | FIELD_ID_VALUE_BOOL, kv.value_bool());
152 } else if (kv.has_value_float()) {
153 mProto->write(FIELD_TYPE_FLOAT | FIELD_ID_VALUE_FLOAT, kv.value_float());
154 }
155 mProto->end(dimensionToken);
156 }
157
158 // Then fill bucket_info (CountBucketInfo).
Yao Chen93fe3a32017-11-02 13:52:59 -0700159 for (const auto& bucket : counter.second) {
yrob0378b02017-11-09 20:36:25 -0800160 long long bucketInfoToken =
161 mProto->start(FIELD_TYPE_MESSAGE | FIELD_COUNT_REPEATED | FIELD_ID_BUCKET_INFO);
Yao Chen93fe3a32017-11-02 13:52:59 -0700162 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_START_BUCKET_NANOS,
163 (long long)bucket.mBucketStartNs);
164 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_END_BUCKET_NANOS,
165 (long long)bucket.mBucketEndNs);
166 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_COUNT, (long long)bucket.mCount);
167 mProto->end(bucketInfoToken);
168 VLOG("\t bucket [%lld - %lld] count: %lld", (long long)bucket.mBucketStartNs,
169 (long long)bucket.mBucketEndNs, (long long)bucket.mCount);
yro24809bd2017-10-31 23:06:53 -0700170 }
yro24809bd2017-10-31 23:06:53 -0700171 mProto->end(wrapperToken);
Yao Chen729093d2017-10-16 10:33:26 -0700172 }
yro24809bd2017-10-31 23:06:53 -0700173
174 mProto->end(mProtoToken);
175 mProto->write(FIELD_TYPE_INT64 | FIELD_ID_END_REPORT_NANOS,
176 (long long)mCurrentBucketStartTimeNs);
177
yro2b0f8862017-11-06 14:27:31 -0800178 VLOG("metric %lld dump report now...", mMetric.metric_id());
yro17adac92017-11-08 23:16:29 -0800179 std::unique_ptr<std::vector<uint8_t>> buffer = serializeProto();
yro24809bd2017-10-31 23:06:53 -0700180
181 startNewProtoOutputStream(endTime);
Yao Chen93fe3a32017-11-02 13:52:59 -0700182 mPastBuckets.clear();
yro24809bd2017-10-31 23:06:53 -0700183 mByteSize = 0;
184
yro17adac92017-11-08 23:16:29 -0800185 return buffer;
yro24809bd2017-10-31 23:06:53 -0700186
187 // TODO: Clear mDimensionKeyMap once the report is dumped.
Yao Chen44cf27c2017-09-14 22:32:50 -0700188}
189
Yao Chen5154a372017-10-30 22:57:06 -0700190void CountMetricProducer::onConditionChanged(const bool conditionMet, const uint64_t eventTime) {
Yao Chen729093d2017-10-16 10:33:26 -0700191 VLOG("Metric %lld onConditionChanged", mMetric.metric_id());
Yao Chencaf339d2017-10-06 16:01:10 -0700192 mCondition = conditionMet;
193}
194
Yao Chenb7041772017-10-20 16:59:25 -0700195void CountMetricProducer::onMatchedLogEventInternal(
196 const size_t matcherIndex, const HashableDimensionKey& eventKey,
197 const map<string, HashableDimensionKey>& conditionKey, bool condition,
Chenjie Yub3dda412017-10-24 13:41:59 -0700198 const LogEvent& event, bool scheduledPull) {
Yao Chen729093d2017-10-16 10:33:26 -0700199 uint64_t eventTimeNs = event.GetTimestampNs();
Yao Chen44cf27c2017-09-14 22:32:50 -0700200
Yao Chen729093d2017-10-16 10:33:26 -0700201 flushCounterIfNeeded(eventTimeNs);
202
Yao Chenb7041772017-10-20 16:59:25 -0700203 if (condition == false) {
204 return;
Yao Chen44cf27c2017-09-14 22:32:50 -0700205 }
Yao Chen729093d2017-10-16 10:33:26 -0700206
Yang Lu3eba6212017-10-25 19:54:45 -0700207 auto it = mCurrentSlicedCounter->find(eventKey);
Yao Chen729093d2017-10-16 10:33:26 -0700208
Yang Lu3eba6212017-10-25 19:54:45 -0700209 if (it == mCurrentSlicedCounter->end()) {
Yao Chen729093d2017-10-16 10:33:26 -0700210 // create a counter for the new key
Yang Lu3eba6212017-10-25 19:54:45 -0700211 (*mCurrentSlicedCounter)[eventKey] = 1;
Yao Chen729093d2017-10-16 10:33:26 -0700212 } else {
213 // increment the existing value
214 auto& count = it->second;
215 count++;
216 }
217
Yao Chenb7041772017-10-20 16:59:25 -0700218 VLOG("metric %lld %s->%d", mMetric.metric_id(), eventKey.c_str(),
Yang Lu3eba6212017-10-25 19:54:45 -0700219 (*mCurrentSlicedCounter)[eventKey]);
Yao Chen44cf27c2017-09-14 22:32:50 -0700220}
221
Yao Chen729093d2017-10-16 10:33:26 -0700222// When a new matched event comes in, we check if event falls into the current
223// bucket. If not, flush the old counter to past buckets and initialize the new bucket.
224void CountMetricProducer::flushCounterIfNeeded(const uint64_t eventTimeNs) {
225 if (mCurrentBucketStartTimeNs + mBucketSizeNs > eventTimeNs) {
Yao Chen44cf27c2017-09-14 22:32:50 -0700226 return;
227 }
228
Yao Chen44cf27c2017-09-14 22:32:50 -0700229 // adjust the bucket start time
Yang Lu3eba6212017-10-25 19:54:45 -0700230 // TODO: This (and addPastBucket to which it goes) doesn't really need to be an int64.
231 uint64_t numBucketsForward = (eventTimeNs - mCurrentBucketStartTimeNs) / mBucketSizeNs;
Bookatza4bc9c42017-10-04 11:45:57 -0700232
Yao Chen93fe3a32017-11-02 13:52:59 -0700233 CountBucket info;
234 info.mBucketStartNs = mCurrentBucketStartTimeNs;
235 info.mBucketEndNs = mCurrentBucketStartTimeNs + mBucketSizeNs;
Yang Lu3eba6212017-10-25 19:54:45 -0700236 for (const auto& counter : *mCurrentSlicedCounter) {
Yao Chen93fe3a32017-11-02 13:52:59 -0700237 info.mCount = counter.second;
238 auto& bucketList = mPastBuckets[counter.first];
239 bucketList.push_back(info);
Yao Chen729093d2017-10-16 10:33:26 -0700240 VLOG("metric %lld, dump key value: %s -> %d", mMetric.metric_id(), counter.first.c_str(),
241 counter.second);
Yao Chen93fe3a32017-11-02 13:52:59 -0700242 mByteSize += sizeof(info);
Yao Chen729093d2017-10-16 10:33:26 -0700243 }
244
Yang Lu3eba6212017-10-25 19:54:45 -0700245 for (auto& tracker : mAnomalyTrackers) {
246 tracker->addOrUpdateBucket(mCurrentSlicedCounter, mCurrentBucketNum);
247 tracker->declareAndDeclareAnomaly();
248 }
Bookatzd3606c72017-10-19 10:13:49 -0700249
Yang Lu3eba6212017-10-25 19:54:45 -0700250 // Reset counters (do not clear, since the old one is still referenced in mAnomalyTrackers).
251 mCurrentSlicedCounter = std::make_shared<DimToValMap>();
Yao Chen729093d2017-10-16 10:33:26 -0700252
253 mCurrentBucketStartTimeNs = mCurrentBucketStartTimeNs + numBucketsForward * mBucketSizeNs;
Yang Lu3eba6212017-10-25 19:54:45 -0700254 mCurrentBucketNum += numBucketsForward;
Yao Chen729093d2017-10-16 10:33:26 -0700255 VLOG("metric %lld: new bucket start time: %lld", mMetric.metric_id(),
256 (long long)mCurrentBucketStartTimeNs);
Yao Chen44cf27c2017-09-14 22:32:50 -0700257}
258
yro24809bd2017-10-31 23:06:53 -0700259// Rough estimate of CountMetricProducer buffer stored. This number will be
260// greater than actual data size as it contains each dimension of
261// CountMetricData is duplicated.
yro69007c82017-10-26 20:42:57 -0700262size_t CountMetricProducer::byteSize() {
yro24809bd2017-10-31 23:06:53 -0700263 return mByteSize;
yro69007c82017-10-26 20:42:57 -0700264}
265
Yao Chen44cf27c2017-09-14 22:32:50 -0700266} // namespace statsd
267} // namespace os
yro69007c82017-10-26 20:42:57 -0700268} // namespace android