b0dc10ebed9e1d24faedd08b59fa4c2480d1e9a3
[lhc/web/wiklou.git] / includes / libs / rdbms / ChronologyProtector.php
1 <?php
2 /**
3 * Chronology protection: tracks per-client master positions so replica reads see that client's writes.
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
9 *
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
19 *
20 * @file
21 * @ingroup Database
22 */
23
24 namespace Wikimedia\Rdbms;
25
26 use Psr\Log\LoggerAwareInterface;
27 use Psr\Log\LoggerInterface;
28 use Psr\Log\NullLogger;
29 use Wikimedia\WaitConditionLoop;
30 use BagOStuff;
31
32 /**
33 * Class for ensuring a consistent ordering of events as seen by the user, despite replication.
34 * Kind of like Hawking's [[Chronology Protection Agency]].
35 */
class ChronologyProtector implements LoggerAwareInterface {
	/** @var BagOStuff Store used for the per-client position data and "touched" timestamps */
	protected $store;
	/** @var LoggerInterface */
	protected $logger;

	/** @var string Storage key name */
	protected $key;
	/** @var string Hash of client parameters */
	protected $clientId;
	/** @var (string|null)[] Map of client information fields for logging */
	protected $clientLogInfo;
	/** @var int|null Expected minimum index of the last write to the position store */
	protected $waitForPosIndex;
	/** @var int Max seconds to wait on positions to appear */
	protected $waitForPosStoreTimeout = self::POS_STORE_WAIT_TIMEOUT;
	/** @var bool Whether protection is active; if false, initLB()/shutdownLB()/shutdown() no-op */
	protected $enabled = true;
	/** @var bool Whether to check and wait on positions */
	protected $wait = true;

	/** @var bool Whether the client data was loaded */
	protected $initialized = false;
	/** @var DBMasterPos[] Map of (DB master name => position) */
	protected $startupPositions = [];
	/** @var DBMasterPos[] Map of (DB master name => position) */
	protected $shutdownPositions = [];
	/** @var int[] Map of (DB master name => 1) */
	protected $shutdownTouchDBs = [];

	/** @var int Seconds to store positions */
	const POSITION_TTL = 60;
	/**
	 * @var int Seconds to store position write index cookies (safely less than POSITION_TTL)
	 *
	 * This must stay below POSITION_TTL: a client presenting a write index for positions
	 * that already expired makes initPositions() wait out the whole POS_STORE_WAIT_TIMEOUT.
	 * The constant is not read inside this class; presumably it is consumed by whatever
	 * code issues the index cookie (verify against callers).
	 */
	const POSITION_COOKIE_TTL = 10;
	/** @var int Max time to wait for positions to appear */
	const POS_STORE_WAIT_TIMEOUT = 5;

	/**
	 * @param BagOStuff $store
	 * @param array $client Map of (ip: <IP>, agent: <user-agent> [, clientId: <hash>] );
	 *   "ip" and "agent" are always read (for logging), even when "clientId" is given
	 * @param int|null $posIndex Write counter index [optional]
	 * @since 1.27
	 */
	public function __construct( BagOStuff $store, array $client, $posIndex = null ) {
		$this->store = $store;
		// Use the caller-supplied ID if present; otherwise derive one from the IP and agent
		$this->clientId = $client['clientId']
			?? md5( $client['ip'] . "\n" . $client['agent'] );
		$this->key = $store->makeGlobalKey( __CLASS__, $this->clientId, 'v2' );
		$this->waitForPosIndex = $posIndex;

		$this->clientLogInfo = [
			'clientIP' => $client['ip'],
			'clientAgent' => $client['agent'],
			'clientId' => $client['clientId'] ?? null
		];

		$this->logger = new NullLogger();
	}

	/**
	 * @param LoggerInterface $logger Logger that replaces the default NullLogger
	 */
	public function setLogger( LoggerInterface $logger ) {
		$this->logger = $logger;
	}

	/**
	 * @return string Client ID hash
	 * @since 1.32
	 */
	public function getClientId() {
		return $this->clientId;
	}

	/**
	 * @param bool $enabled Whether protection is active; passing false turns initLB(),
	 *   shutdownLB() and shutdown() into no-ops
	 * @since 1.27
	 */
	public function setEnabled( $enabled ) {
		$this->enabled = $enabled;
	}

	/**
	 * @param bool $enabled Whether to check and wait on positions
	 * @since 1.27
	 */
	public function setWaitEnabled( $enabled ) {
		$this->wait = $enabled;
	}

	/**
	 * Initialise a ILoadBalancer to give it appropriate chronology protection.
	 *
	 * If the stash has a previous master position recorded, this will try to
	 * make sure that the next query to a replica DB of that master will see changes up
	 * to that position by delaying execution. The delay may timeout and allow stale
	 * data if no non-lagged replica DBs are available.
	 *
	 * @param ILoadBalancer $lb
	 * @return void
	 */
	public function initLB( ILoadBalancer $lb ) {
		if ( !$this->enabled || $lb->getServerCount() <= 1 ) {
			return; // non-replicated setup or disabled
		}

		// Lazily load the positions stored for this client (only done once)
		$this->initPositions();

		$masterName = $lb->getServerName( $lb->getWriterIndex() );
		$pos = $this->startupPositions[$masterName] ?? null;
		if ( $pos instanceof DBMasterPos ) {
			$this->logger->debug( __METHOD__ . ": LB for '$masterName' set to pos $pos\n" );
			$lb->waitFor( $pos );
		}
	}

	/**
	 * Notify the ChronologyProtector that the ILoadBalancer is about to shut
	 * down. Saves replication positions.
	 *
	 * The position is only remembered in memory here; shutdown() is what writes it
	 * to the store.
	 *
	 * @param ILoadBalancer $lb
	 * @return void
	 */
	public function shutdownLB( ILoadBalancer $lb ) {
		if ( !$this->enabled ) {
			return; // not enabled
		}
		if ( !$lb->hasOrMadeRecentMasterChanges( INF ) ) {
			// Only save the position if writes have been done on the connection
			return;
		}

		$masterName = $lb->getServerName( $lb->getWriterIndex() );
		if ( $lb->getServerCount() > 1 ) {
			$pos = $lb->getMasterPos();
			if ( $pos ) {
				$this->logger->debug( __METHOD__ . ": LB for '$masterName' has pos $pos\n" );
				$this->shutdownPositions[$masterName] = $pos;
			}
		} else {
			$this->logger->debug( __METHOD__ . ": DB '$masterName' touched\n" );
		}
		// Flag the master as touched, whether or not a position was recorded
		$this->shutdownTouchDBs[$masterName] = 1;
	}

	/**
	 * Notify the ChronologyProtector that the LBFactory is done calling shutdownLB() for now.
	 * May commit chronology data to persistent storage.
	 *
	 * @param callable|null $workCallback Work to do instead of waiting on syncing positions
	 * @param string $mode One of (sync, async); whether to wait on remote datacenters
	 * @param int|null &$cpIndex DB position key write counter; incremented on update
	 *   and reset to null when the positions could not be saved
	 * @return DBMasterPos[] Empty on success; returns the (db name => position) map on
	 *   failure, and also in "sync" mode when the store does not report support for
	 *   synchronous writes
	 */
	public function shutdown( callable $workCallback = null, $mode = 'sync', &$cpIndex = null ) {
		if ( !$this->enabled ) {
			return [];
		}

		$store = $this->store;
		// Some callers might want to know if a user recently touched a DB.
		// These writes do not need to block on all datacenters receiving them.
		foreach ( $this->shutdownTouchDBs as $dbName => $unused ) {
			$store->set(
				$this->getTouchedKey( $this->store, $dbName ),
				microtime( true ),
				$store::TTL_DAY
			);
		}

		if ( !count( $this->shutdownPositions ) ) {
			return []; // nothing to save
		}

		$this->logger->debug( __METHOD__ . ": saving master pos for " .
			implode( ', ', array_keys( $this->shutdownPositions ) ) . "\n"
		);

		// CP-protected writes should overwhelmingly go to the master datacenter, so use a
		// DC-local lock to merge the values. Use a DC-local get() and a synchronous all-DC
		// set(). This makes it possible for the BagOStuff class to write in parallel to all
		// DCs with one RTT. The use of WRITE_SYNC avoids needing READ_LATEST for the get().
		$ok = false;
		if ( $store->lock( $this->key, 3 ) ) {
			try {
				if ( $workCallback ) {
					// Let the store run the work before blocking on a replication sync barrier.
					// If replication caught up while the work finished, the barrier will be fast.
					$store->addBusyCallback( $workCallback );
				}
				$ok = $store->set(
					$this->key,
					$this->mergePositions(
						$store->get( $this->key ),
						$this->shutdownPositions,
						$cpIndex
					),
					self::POSITION_TTL,
					( $mode === 'sync' ) ? $store::WRITE_SYNC : 0
				);
			} finally {
				// Always release the lock, even if reading, merging or writing threw
				$store->unlock( $this->key );
			}
		}

		if ( !$ok ) {
			$cpIndex = null; // nothing saved
			$bouncedPositions = $this->shutdownPositions;
			// Raced out too many times or stash is down
			$this->logger->warning( __METHOD__ . ": failed to save master pos for " .
				implode( ', ', array_keys( $this->shutdownPositions ) ) . "\n"
			);
		} elseif ( $mode === 'sync' &&
			$store->getQoS( $store::ATTR_SYNCWRITES ) < $store::QOS_SYNCWRITES_BE
		) {
			// Positions may not be in all datacenters, force LBFactory to play it safe
			$this->logger->info( __METHOD__ . ": store may not support synchronous writes." );
			$bouncedPositions = $this->shutdownPositions;
		} else {
			$bouncedPositions = [];
		}

		return $bouncedPositions;
	}

	/**
	 * @param string $dbName DB master name (e.g. "db1052")
	 * @return float|bool UNIX timestamp when client last touched the DB; false if not on record
	 * @since 1.28
	 */
	public function getTouched( $dbName ) {
		return $this->store->get( $this->getTouchedKey( $this->store, $dbName ) );
	}

	/**
	 * Build the store key under which this client's "touched" timestamp for a DB is kept
	 *
	 * @param BagOStuff $store
	 * @param string $dbName
	 * @return string
	 */
	private function getTouchedKey( BagOStuff $store, $dbName ) {
		return $store->makeGlobalKey( __CLASS__, 'mtime', $this->clientId, $dbName );
	}

	/**
	 * Load in previous master positions for the client
	 *
	 * Runs at most once per instance. When waiting is disabled the store is not read
	 * and the startup positions are left empty.
	 */
	protected function initPositions() {
		if ( $this->initialized ) {
			return;
		}
		$this->initialized = true;

		if ( !$this->wait ) {
			$this->startupPositions = [];
			$this->logger->debug( __METHOD__ . ": key is {$this->key} (unread)\n" );

			return;
		}

		// If there is an expectation to see master positions from a certain write
		// index or higher, then block until it appears, or until a timeout is reached.
		// Since the write index restarts each time the key is created, it is possible that
		// a lagged store has a matching key write index. However, in that case, it should
		// already be expired and thus treated as non-existing, maintaining correctness.
		if ( $this->waitForPosIndex > 0 ) {
			$data = null;
			$indexReached = null; // highest index reached in the position store
			$loop = new WaitConditionLoop(
				function () use ( &$data, &$indexReached ) {
					$data = $this->store->get( $this->key );
					if ( !is_array( $data ) ) {
						return WaitConditionLoop::CONDITION_CONTINUE; // not found yet
					} elseif ( !isset( $data['writeIndex'] ) ) {
						return WaitConditionLoop::CONDITION_REACHED; // b/c
					}
					$indexReached = max( $data['writeIndex'], $indexReached );

					return ( $data['writeIndex'] >= $this->waitForPosIndex )
						? WaitConditionLoop::CONDITION_REACHED
						: WaitConditionLoop::CONDITION_CONTINUE;
				},
				$this->waitForPosStoreTimeout
			);
			$result = $loop->invoke();
			$waitedMs = $loop->getLastWaitTime() * 1e3;

			if ( $result === $loop::CONDITION_REACHED ) {
				$this->logger->debug(
					__METHOD__ . ": expected and found position index.",
					[
						'cpPosIndex' => $this->waitForPosIndex,
						'waitTimeMs' => $waitedMs
					] + $this->clientLogInfo
				);
			} else {
				$this->logger->warning(
					__METHOD__ . ": expected but failed to find position index.",
					[
						'cpPosIndex' => $this->waitForPosIndex,
						'indexReached' => $indexReached,
						'waitTimeMs' => $waitedMs
					] + $this->clientLogInfo
				);
			}
		} else {
			$data = $this->store->get( $this->key );
		}

		// Whatever was last read is used, even after a timeout (older positions still help).
		// A miss (non-array) or an entry lacking "positions" counts as no positions.
		$this->startupPositions = is_array( $data ) ? ( $data['positions'] ?? [] ) : [];
		$this->logger->debug( __METHOD__ . ": key is {$this->key} (read)\n" );
	}

	/**
	 * Merge this request's positions into the stored value and bump the write index
	 *
	 * @param array|bool $curValue Value currently in the store; a non-array (e.g. false
	 *   for a miss) is treated as having no positions and a write index of 0
	 * @param DBMasterPos[] $shutdownPositions Map of (DB master name => position)
	 * @param int|null &$cpIndex Set to the write index of the returned value
	 * @return array Map of (positions: (DB master name => position), writeIndex: int)
	 */
	protected function mergePositions( $curValue, array $shutdownPositions, &$cpIndex = null ) {
		if ( !is_array( $curValue ) ) {
			$curValue = [];
		}

		/** @var DBMasterPos[] $curPositions */
		$curPositions = $curValue['positions'] ?? [];
		// Use the newest positions for each DB master
		foreach ( $shutdownPositions as $db => $pos ) {
			if (
				!isset( $curPositions[$db] ) ||
				!( $curPositions[$db] instanceof DBMasterPos ) ||
				$pos->asOfTime() > $curPositions[$db]->asOfTime()
			) {
				$curPositions[$db] = $pos;
			}
		}

		// The index restarts from 0 (so the first write gets 1) whenever the key is re-created
		$cpIndex = $curValue['writeIndex'] ?? 0;

		return [
			'positions' => $curPositions,
			'writeIndex' => ++$cpIndex
		];
	}
}