1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49
|
<?php
/**
* @file
* @author Niklas Laxström
* @license GPL-2.0-or-later
*/
namespace LocalisationUpdate\Fetcher;
/**
* This class uses GitHub api to obtain a list of files present in a directory
* to avoid fetching files that don't exist.
*
* @todo Could use file hashes to 1) avoid fetching files with same hash as
* the source. 2) avoid fetching files which haven't changed since last check
* if we store them.
*/
class GitHubFetcher extends HttpFetcher {
/**
* @param string $pattern
*
* @return array
* @throws \Exception
*/
public function fetchDirectory( $pattern ) {
global $wgLocalisationUpdateHttpRequestOptions;
$domain = preg_quote( 'https://raw.github.com/', '~' );
$p = "~^$domain(?P<org>[^/]+)/(?P<repo>[^/]+)/(?P<branch>[^/]+)/(?P<path>.+)/.+$~";
preg_match( $p, $pattern, $m );
$apiURL = "https://api.github.com/repos/{$m['org']}/{$m['repo']}/contents/{$m['path']}";
$json = \Http::get( $apiURL, $wgLocalisationUpdateHttpRequestOptions, __METHOD__ );
if ( !$json ) {
throw new \Exception( "Unable to get directory listing for {$m['org']}/{$m['repo']}" );
}
$files = [];
$json = \FormatJson::decode( $json, true );
foreach ( $json as $fileinfo ) {
$fileurl = dirname( $pattern ) . '/' . $fileinfo['name'];
$file = $this->fetchFile( $fileurl );
if ( $file ) {
$files[$fileurl] = $file;
}
}
return $files;
}
}
|