Merge "API: Properly handle limit and continuation for generator=prefixsearch"
[mediawiki.git] / includes / libs / virtualrest / VirtualRESTServiceClient.php
blobe8bb38d89b47d27efbba43607267549a5e0e4de8
1 <?php
2 /**
3 * Virtual HTTP service client
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
7 * the Free Software Foundation; either version 2 of the License, or
8 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
15 * You should have received a copy of the GNU General Public License along
16 * with this program; if not, write to the Free Software Foundation, Inc.,
17 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
18 * http://www.gnu.org/copyleft/gpl.html
20 * @file
/**
 * Virtual HTTP service client loosely styled after a Virtual File System
 *
 * Services can be mounted on path prefixes so that virtual HTTP operations
 * against sub-paths will map to those services. Operations can actually be
 * done using HTTP messages over the wire or may simply be emulated locally.
 *
 * Virtual HTTP request maps are arrays that use the following format:
 *   - method   : GET/HEAD/PUT/POST/DELETE
 *   - url      : HTTP/HTTPS URL or virtual service path with a registered prefix
 *   - query    : <query parameter field/value associative array> (uses RFC 3986)
 *   - headers  : <header name/value associative array>
 *   - body     : source to get the HTTP request body from;
 *                this can simply be a string (always), a resource for
 *                PUT requests, and a field/value array for POST request;
 *                array bodies are encoded as multipart/form-data and strings
 *                use application/x-www-form-urlencoded (headers sent automatically)
 *   - stream   : resource to stream the HTTP response body to
 * Request maps can use integer index 0 instead of 'method' and 1 instead of 'url'.
 *
 * @author Aaron Schulz
 * @since 1.23
 */
class VirtualRESTServiceClient {
	/** @var MultiHttpClient */
	protected $http;
	/** @var array Map of (prefix => VirtualRESTService) */
	protected $instances = array();

	/** Mount points look like "/name/" or "/name/sub/": lowercase alphanumeric segments */
	const VALID_MOUNT_REGEX = '#^/[0-9a-z]+/([0-9a-z]+/)*$#';

	/**
	 * @param MultiHttpClient $http Client used to run the non-emulated HTTP requests
	 */
	public function __construct( MultiHttpClient $http ) {
		$this->http = $http;
	}

	/**
	 * Map a prefix to service handler
	 *
	 * @param string $prefix Virtual path
	 * @param VirtualRESTService $instance
	 * @throws UnexpectedValueException If the prefix is malformed or already in use
	 */
	public function mount( $prefix, VirtualRESTService $instance ) {
		if ( !preg_match( self::VALID_MOUNT_REGEX, $prefix ) ) {
			throw new UnexpectedValueException( "Invalid service mount point '$prefix'." );
		} elseif ( isset( $this->instances[$prefix] ) ) {
			throw new UnexpectedValueException( "A service is already mounted on '$prefix'." );
		}
		$this->instances[$prefix] = $instance;
	}

	/**
	 * Unmap a prefix to service handler
	 *
	 * @param string $prefix Virtual path
	 * @throws UnexpectedValueException If the prefix is malformed or nothing is mounted there
	 */
	public function unmount( $prefix ) {
		if ( !preg_match( self::VALID_MOUNT_REGEX, $prefix ) ) {
			throw new UnexpectedValueException( "Invalid service mount point '$prefix'." );
		} elseif ( !isset( $this->instances[$prefix] ) ) {
			throw new UnexpectedValueException( "No service is mounted on '$prefix'." );
		}
		unset( $this->instances[$prefix] );
	}

	/**
	 * Get the prefix and service that a virtual path is serviced by
	 *
	 * When several mounted prefixes match, the one with the most path
	 * segments (i.e. the most specific one) wins.
	 *
	 * @param string $path
	 * @return array (prefix,VirtualRESTService) or (null,null) if none found
	 */
	public function getMountAndService( $path ) {
		$bestPrefix = null;
		$bestDepth = -1;
		foreach ( $this->instances as $prefix => $service ) {
			if ( strpos( $path, $prefix ) !== 0 ) {
				continue; // $path does not start with this mount point
			}
			// Depth is measured in '/' characters, so deeper prefixes are more specific
			$depth = substr_count( $prefix, '/' );
			if ( $depth > $bestDepth ) {
				$bestPrefix = $prefix;
				$bestDepth = $depth;
			}
		}

		// Return the most specific prefix and corresponding service
		return ( $bestPrefix !== null )
			? array( $bestPrefix, $this->instances[$bestPrefix] )
			: array( null, null );
	}

	/**
	 * Execute a virtual HTTP(S) request
	 *
	 * This method returns a response map of:
	 *   - code    : HTTP response code or 0 if there was a serious cURL error
	 *   - reason  : HTTP response reason (empty if there was a serious cURL error)
	 *   - headers : <header name/value associative array>
	 *   - body    : HTTP response body or resource (if "stream" was set)
	 *   - error   : Any cURL error string
	 * The map also stores integer-indexed copies of these values. This lets callers do:
	 * <code>
	 *     list( $rcode, $rdesc, $rhdrs, $rbody, $rerr ) = $client->run( $req );
	 * </code>
	 * @param array $req Virtual HTTP request map
	 * @return array Response array for request
	 */
	public function run( array $req ) {
		$responses = $this->runMulti( array( $req ) );
		return $responses[0];
	}

	/**
	 * Execute a set of virtual HTTP(S) requests concurrently
	 *
	 * A map of requests keys to response maps is returned. Each response map has:
	 *   - code    : HTTP response code or 0 if there was a serious cURL error
	 *   - reason  : HTTP response reason (empty if there was a serious cURL error)
	 *   - headers : <header name/value associative array>
	 *   - body    : HTTP response body or resource (if "stream" was set)
	 *   - error   : Any cURL error string
	 * The map also stores integer-indexed copies of these values. This lets callers do:
	 * <code>
	 *     list( $rcode, $rdesc, $rhdrs, $rbody, $rerr ) = $responses[0];
	 * </code>
	 *
	 * @param array $reqs Map of Virtual HTTP request maps
	 * @return array $reqs Map of corresponding response values with the same keys/order
	 * @throws UnexpectedValueException If a request has no URL, no service is mounted
	 *   for its path, or no response was produced for it
	 * @throws Exception If services keep replacing requests for too many rounds
	 */
	public function runMulti( array $reqs ) {
		if ( !$reqs ) {
			return array(); // nothing to run; skip the HTTP client entirely
		}

		// Normalize the short-form (integer-indexed) request fields
		foreach ( $reqs as &$req ) {
			if ( isset( $req[0] ) ) {
				$req['method'] = $req[0]; // short-form
				unset( $req[0] );
			}
			if ( isset( $req[1] ) ) {
				$req['url'] = $req[1]; // short-form
				unset( $req[1] );
			}
			$req['chain'] = array(); // chain or list of replaced requests
		}
		unset( $req ); // don't assign over this by accident

		$curUniqueId = 0;
		$armoredIndexMap = array(); // (original index => new index)

		$doneReqs = array(); // (index => request)
		$executeReqs = array(); // (index => request)
		$replaceReqsByService = array(); // (prefix => index => request)
		$origPending = array(); // (index => 1) for original requests

		foreach ( $reqs as $origIndex => $req ) {
			// Re-index keys to consecutive integers (they will be swapped back later)
			$index = $curUniqueId++;
			$armoredIndexMap[$origIndex] = $index;
			$origPending[$index] = 1;
			if ( !isset( $req['url'] ) ) {
				// Fail clearly instead of emitting notices and a confusing "no service" error
				throw new UnexpectedValueException( "Request '$origIndex' has no 'url' field." );
			}
			if ( preg_match( '#^(http|ftp)s?://#', $req['url'] ) ) {
				// Absolute FTP/HTTP(S) URL, run it as normal
				$executeReqs[$index] = $req;
			} else {
				// Must be a virtual HTTP URL; resolve it
				list( $prefix, $service ) = $this->getMountAndService( $req['url'] );
				if ( !$service ) {
					throw new UnexpectedValueException( "Path '{$req['url']}' has no service." );
				}
				// Set the URL to the mount-relative portion
				$req['url'] = substr( $req['url'], strlen( $prefix ) );
				$replaceReqsByService[$prefix][$index] = $req;
			}
		}

		// Function to get IDs that won't collide with keys in $armoredIndexMap
		$idFunc = function() use ( &$curUniqueId ) {
			return $curUniqueId++;
		};

		$rounds = 0;
		do {
			if ( ++$rounds > 5 ) { // sanity
				throw new Exception( "Too many replacement rounds detected. Aborting." );
			}
			// Track requests executed this round that have a prefix/service.
			// Note that this also includes requests where 'response' was forced.
			$checkReqIndexesByPrefix = array();
			// Resolve the virtual URLs to valid and qualified HTTP(S) URLs
			// and add any required authentication headers for the backend.
			// Services can also replace requests with new ones, either to
			// defer the original or to set a proxy response to the original.
			$newReplaceReqsByService = array();
			foreach ( $replaceReqsByService as $prefix => $servReqs ) {
				$service = $this->instances[$prefix];
				foreach ( $service->onRequests( $servReqs, $idFunc ) as $index => $req ) {
					// Services use unique IDs for replacement requests
					if ( isset( $servReqs[$index] ) || isset( $origPending[$index] ) ) {
						// A current or original request which was not modified
					} else {
						// Replacement request that will convert to original requests
						$newReplaceReqsByService[$prefix][$index] = $req;
					}
					if ( isset( $req['response'] ) ) {
						// Replacement requests with pre-set responses should not execute
						unset( $executeReqs[$index] );
						unset( $origPending[$index] );
						$doneReqs[$index] = $req;
					} else {
						// Original or mangled request included
						$executeReqs[$index] = $req;
					}
					$checkReqIndexesByPrefix[$prefix][$index] = 1;
				}
			}
			// Update index of requests to inspect for replacement
			$replaceReqsByService = $newReplaceReqsByService;
			// Run the actual work HTTP requests
			foreach ( $this->http->runMulti( $executeReqs ) as $index => $ranReq ) {
				$doneReqs[$index] = $ranReq;
				unset( $origPending[$index] );
			}
			$executeReqs = array();
			// Services can also replace requests with new ones, either to
			// defer the original or to set a proxy response to the original.
			// Any replacement requests executed above will need to be replaced
			// with new requests (eventually the original). The responses can be
			// forced by setting 'response' rather than actually be sent over the wire.
			$newReplaceReqsByService = array();
			foreach ( $checkReqIndexesByPrefix as $prefix => $servReqIndexes ) {
				$service = $this->instances[$prefix];
				// $doneReqs actually has the requests (with 'response' set)
				$servReqs = array_intersect_key( $doneReqs, $servReqIndexes );
				foreach ( $service->onResponses( $servReqs, $idFunc ) as $index => $req ) {
					// Services use unique IDs for replacement requests
					if ( isset( $servReqs[$index] ) || isset( $origPending[$index] ) ) {
						// A current or original request which was not modified
					} else {
						// Replacement request that will convert to original requests
						$newReplaceReqsByService[$prefix][$index] = $req;
					}
					if ( isset( $req['response'] ) ) {
						// Replacement requests with pre-set responses should not execute
						unset( $origPending[$index] );
						$doneReqs[$index] = $req;
					} else {
						// Update the request in case it was mangled
						$executeReqs[$index] = $req;
					}
				}
			}
			// Update index of requests to inspect for replacement
			$replaceReqsByService = $newReplaceReqsByService;
		} while ( count( $origPending ) );

		$responses = array();
		// Collect the 'response' of each finished request under its original key.
		// This maintains the original order of $reqs.
		foreach ( $reqs as $origIndex => $req ) {
			$index = $armoredIndexMap[$origIndex];
			if ( !isset( $doneReqs[$index] ) ) {
				throw new UnexpectedValueException( "Response for request '$index' is NULL." );
			}
			$responses[$origIndex] = $doneReqs[$index]['response'];
		}

		return $responses;
	}
}