blob: 074e5a304f065f2b05c64d82e6be89e254eb365d [file] [log] [blame]
// Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
4
Paul Stewart6c72c972012-07-27 11:29:20 -07005#ifndef SHILL_LINK_MONITOR_H_
6#define SHILL_LINK_MONITOR_H_
7
#include <sys/time.h>
#include <time.h>

#include <string>

#include <base/callback.h>
#include <base/cancelable_callback.h>
#include <base/memory/scoped_ptr.h>

#include "shill/byte_string.h"
#include "shill/refptr_types.h"
16
17namespace shill {
18
Paul Stewart6c72c972012-07-27 11:29:20 -070019class ArpClient;
20class DeviceInfo;
Paul Stewart3f43f432012-07-16 12:12:45 -070021class EventDispatcher;
Paul Stewart6c72c972012-07-27 11:29:20 -070022class IOHandler;
Paul Stewartff845fc2012-08-07 07:28:44 -070023class Metrics;
Paul Stewart6c72c972012-07-27 11:29:20 -070024class Time;
Paul Stewart3f43f432012-07-16 12:12:45 -070025
26// LinkMonitor tracks the status of a connection by sending ARP
27// messages to the default gateway for a connection. It keeps
Paul Stewart6c72c972012-07-27 11:29:20 -070028// track of response times which can be an indicator of link
29// quality. It signals to caller that the link has failed if
30// too many requests go unanswered.
Paul Stewart3f43f432012-07-16 12:12:45 -070031class LinkMonitor {
32 public:
Paul Stewart6c72c972012-07-27 11:29:20 -070033 typedef base::Closure FailureCallback;
Paul Stewart3f43f432012-07-16 12:12:45 -070034
Paul Stewart0443aa52012-08-09 10:43:50 -070035 // When the sum of consecutive unicast and broadcast failures
36 // equals this value, the failure callback is called, the counters
37 // are reset, and the link monitoring quiesces. Needed by Metrics.
Paul Stewartf1961f82012-09-11 20:45:39 -070038 static const int kFailureThreshold;
Paul Stewart0443aa52012-08-09 10:43:50 -070039
Paul Stewartff845fc2012-08-07 07:28:44 -070040 // The number of milliseconds between ARP requests. Needed by Metrics.
Paul Stewartf1961f82012-09-11 20:45:39 -070041 static const int kTestPeriodMilliseconds;
Paul Stewartff845fc2012-08-07 07:28:44 -070042
Paul Stewart036dba02012-08-07 12:34:41 -070043 // The default list of technologies for which link monitoring is enabled.
44 static const char kDefaultLinkMonitorTechnologies[];
45
Paul Stewart3f43f432012-07-16 12:12:45 -070046 LinkMonitor(const ConnectionRefPtr &connection,
Paul Stewartf1961f82012-09-11 20:45:39 -070047 EventDispatcher *dispatcher, // Owned by caller; can't be NULL.
48 Metrics *metrics, // Owned by caller; must not be NULL.
Paul Stewart6c72c972012-07-27 11:29:20 -070049 DeviceInfo *device_info,
Paul Stewart3f43f432012-07-16 12:12:45 -070050 const FailureCallback &failure_callback);
51 virtual ~LinkMonitor();
52
Paul Stewart6c72c972012-07-27 11:29:20 -070053 // Starts link-monitoring on the selected connection. Returns
54 // true if successful, false otherwise.
55 virtual bool Start();
56 virtual void Stop();
57
58 // Return modified cumulative average of the gateway ARP response
59 // time. Returns zero if no samples are available. For each
60 // missed ARP response, the sample is assumed to be the full
61 // test period.
Paul Stewartf1961f82012-09-11 20:45:39 -070062 virtual int GetResponseTimeMilliseconds() const;
Paul Stewart9f7823e2012-08-09 10:58:26 -070063
64 // Returns true if the LinkMonitor was ever able to find the default
65 // gateway via broadcast ARP.
66 virtual bool IsGatewayFound() const;
Paul Stewart3f43f432012-07-16 12:12:45 -070067
68 private:
Paul Stewart6c72c972012-07-27 11:29:20 -070069 friend class LinkMonitorForTest;
70 friend class LinkMonitorTest;
71
Paul Stewart6c72c972012-07-27 11:29:20 -070072 // The number of samples to compute a "strict" average over. When
73 // more samples than this number arrive, this determines how "slow"
74 // our simple low-pass filter works.
Paul Stewartf1961f82012-09-11 20:45:39 -070075 static const int kMaxResponseSampleFilterDepth;
Paul Stewart6c72c972012-07-27 11:29:20 -070076
77 // Add a response time sample to the buffer.
Paul Stewartf1961f82012-09-11 20:45:39 -070078 void AddResponseTimeSample(int response_time_milliseconds);
Paul Stewart6c72c972012-07-27 11:29:20 -070079 // Create an ArpClient instance so we can receive and transmit ARP
80 // packets. This method is virtual so it can be overridden in
81 // unit tests.
82 virtual bool CreateClient();
83 // Convert a hardware address byte-string to a colon-separated string.
84 static std::string HardwareAddressToString(const ByteString &address);
85 // Denote a missed response. Returns true if this loss has caused us
86 // to exceed the failure threshold.
87 bool AddMissedResponse();
88 // This I/O callback is triggered whenever the ARP reception socket
89 // has data available to be received.
90 void ReceiveResponse(int fd);
91 // Send the next ARP request. Returns true if successful, false
92 // otherwise.
93 bool SendRequest();
Paul Stewart6c72c972012-07-27 11:29:20 -070094
Paul Stewartf1961f82012-09-11 20:45:39 -070095 // The connection on which to perform link monitoring.
Paul Stewart3f43f432012-07-16 12:12:45 -070096 ConnectionRefPtr connection_;
Paul Stewartf1961f82012-09-11 20:45:39 -070097 // Dispatcher on which to create delayed tasks.
Paul Stewart3f43f432012-07-16 12:12:45 -070098 EventDispatcher *dispatcher_;
Paul Stewartf1961f82012-09-11 20:45:39 -070099 // Metrics instance on which to post performance results.
Paul Stewartff845fc2012-08-07 07:28:44 -0700100 Metrics *metrics_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700101 // DeviceInfo instance for retrieving the MAC address of a device.
Paul Stewart6c72c972012-07-27 11:29:20 -0700102 DeviceInfo *device_info_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700103 // Failure callback method to call if LinkMonitor fails.
Paul Stewart3f43f432012-07-16 12:12:45 -0700104 FailureCallback failure_callback_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700105 // The MAC address of device associated with this connection.
Paul Stewart6c72c972012-07-27 11:29:20 -0700106 ByteString local_mac_address_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700107 // The MAC address of the default gateway.
Paul Stewart6c72c972012-07-27 11:29:20 -0700108 ByteString gateway_mac_address_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700109 // ArpClient instance used for performing link tests.
Paul Stewart6c72c972012-07-27 11:29:20 -0700110 scoped_ptr<ArpClient> arp_client_;
111
112 // The number of consecutive times we have failed in receiving
113 // responses to broadcast ARP requests.
Paul Stewartf1961f82012-09-11 20:45:39 -0700114 int broadcast_failure_count_;
Paul Stewart6c72c972012-07-27 11:29:20 -0700115 // The number of consecutive times we have failed in receiving
116 // responses to unicast ARP requests.
Paul Stewartf1961f82012-09-11 20:45:39 -0700117 int unicast_failure_count_;
Paul Stewart6c72c972012-07-27 11:29:20 -0700118
119 // Whether this iteration of the test was a unicast request
120 // to the gateway instead of broadcast. The link monitor
121 // alternates between unicast and broadcast requests so that
122 // both types of network traffic is monitored.
123 bool is_unicast_;
124
Paul Stewartf1961f82012-09-11 20:45:39 -0700125 // Number of response samples received in our rolling averge.
126 int response_sample_count_;
127 // The sum of response samples in our rolling average.
128 int response_sample_bucket_;
Paul Stewart6c72c972012-07-27 11:29:20 -0700129
Paul Stewartf1961f82012-09-11 20:45:39 -0700130 // IOCallback that fires when the socket associated with our ArpClient
131 // has a packet to be received. Calls ReceiveResponse().
Paul Stewart6c72c972012-07-27 11:29:20 -0700132 scoped_ptr<IOHandler> receive_response_handler_;
133 // Callback method used for periodic transmission of ARP requests.
134 // When the timer expires this will call SendRequest() through the
135 // void callback function SendRequestTask().
136 base::CancelableClosure send_request_callback_;
137
Paul Stewart0443aa52012-08-09 10:43:50 -0700138 // The time at which the link monitor started.
139 struct timeval started_monitoring_at_;
140
Paul Stewart6c72c972012-07-27 11:29:20 -0700141 // The time at which the last ARP request was sent.
142 struct timeval sent_request_at_;
Paul Stewartf1961f82012-09-11 20:45:39 -0700143 // Time instance for performing GetTimeMonotonic().
Paul Stewart6c72c972012-07-27 11:29:20 -0700144 Time *time_;
Paul Stewart3f43f432012-07-16 12:12:45 -0700145
146 DISALLOW_COPY_AND_ASSIGN(LinkMonitor);
147};
148
149} // namespace shill
150
Paul Stewart6c72c972012-07-27 11:29:20 -0700151#endif // SHILL_LINK_MONITOR_H_