summaryrefslogtreecommitdiff
blob: eba89a9e2d2e2c24aab892096672ae7b573349b5 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
<?php
/**
 * @file
 * @author Niklas Laxström
 * @license GPL-2.0-or-later
 */

namespace LocalisationUpdate\Fetcher;

/**
 * This class uses the GitHub API to obtain a list of the files present in a
 * directory, to avoid fetching files that don't exist.
 *
 * @todo Could use file hashes to 1) avoid fetching files with same hash as
 * the source. 2) avoid fetching files which haven't changed since last check
 * if we store them.
 */
class GitHubFetcher extends HttpFetcher {
	/**
	 * Fetches the files of the GitHub directory that a raw-file URL points into.
	 *
	 * The directory listing is requested from the GitHub contents API for the
	 * branch named in the URL. Each listed entry is then fetched with
	 * fetchFile(), using the directory part of $pattern plus the entry name.
	 *
	 * @param string $pattern URL of the form
	 *  https://raw.github.com/<org>/<repo>/<branch>/<path>/<file pattern>
	 *
	 * @return array Map of file URL => value returned by fetchFile(), holding
	 *  only the entries for which fetchFile() returned a truthy value.
	 * @throws \Exception If $pattern is not in the expected form, or if the
	 *  directory listing cannot be fetched or decoded.
	 */
	public function fetchDirectory( $pattern ) {
		global $wgLocalisationUpdateHttpRequestOptions;

		$domain = preg_quote( 'https://raw.github.com/', '~' );
		$p = "~^$domain(?P<org>[^/]+)/(?P<repo>[^/]+)/(?P<branch>[^/]+)/(?P<path>.+)/.+$~";
		// Without a match none of the named groups exist, so fail early instead
		// of building an API URL out of undefined indexes.
		if ( !preg_match( $p, $pattern, $m ) ) {
			throw new \Exception( "Unsupported GitHub URL pattern: $pattern" );
		}

		// Pass the branch as "ref"; otherwise the API lists the repository's
		// default branch, which may differ from the branch files are fetched from.
		$apiURL = "https://api.github.com/repos/{$m['org']}/{$m['repo']}/contents/{$m['path']}" .
			'?ref=' . rawurlencode( $m['branch'] );
		$json = \Http::get( $apiURL, $wgLocalisationUpdateHttpRequestOptions, __METHOD__ );
		if ( !$json ) {
			throw new \Exception( "Unable to get directory listing for {$m['org']}/{$m['repo']}" );
		}

		$listing = \FormatJson::decode( $json, true );
		if ( !is_array( $listing ) ) {
			throw new \Exception( "Unable to parse directory listing for {$m['org']}/{$m['repo']}" );
		}

		// Loop-invariant: every file lives in the same directory as the pattern.
		$baseUrl = dirname( $pattern );

		$files = [];
		foreach ( $listing as $fileinfo ) {
			// Ignore anything that is not a directory entry with a name, e.g. the
			// scalar fields of a single-object (non-directory) API response.
			if ( !is_array( $fileinfo ) || !isset( $fileinfo['name'] ) ) {
				continue;
			}
			// Subdirectories cannot be fetched as raw files.
			if ( isset( $fileinfo['type'] ) && $fileinfo['type'] === 'dir' ) {
				continue;
			}

			$fileurl = $baseUrl . '/' . $fileinfo['name'];
			$file = $this->fetchFile( $fileurl );
			if ( $file ) {
				$files[$fileurl] = $file;
			}
		}
		return $files;
	}
}