1
|
|
|
<?php declare(strict_types=1); |
2
|
|
|
|
3
|
|
|
namespace Bigwhoop\Trumpet\Commands; |
4
|
|
|
|
5
|
|
|
use Bigwhoop\SentenceBreaker\SentenceBreaker; |
6
|
|
|
|
7
|
|
|
/**
 * Command registered under the token "wiki" that renders the introduction of
 * an English Wikipedia article as a Markdown block quote.
 *
 * The first command argument is the article title; the optional second
 * argument limits the quote to that many leading sentences (0 = no limit).
 * Fetched extracts are cached as text files inside the directory returned by
 * the execution context's ensureTempDirectory().
 */
final class WikiCommand implements Command
{
    const ENDPOINT = 'https://en.wikipedia.org/w/api.php';

    /** @var CommandExecutionContext */
    private $executionContext;

    /** @var SentenceBreaker */
    private $sentenceBreaker;

    /**
     * @param CommandExecutionContext $context         Used to locate the cache directory.
     * @param SentenceBreaker         $sentenceBreaker Used to split extracts into sentences.
     */
    public function __construct(CommandExecutionContext $context, SentenceBreaker $sentenceBreaker)
    {
        $this->executionContext = $context;
        $this->sentenceBreaker = $sentenceBreaker;
    }

    /**
     * @return string The token that selects this command.
     */
    public function getToken(): string
    {
        return 'wiki';
    }

    /**
     * Returns the quoted article introduction, served from the cache when possible.
     *
     * @param CommandParams           $params           First argument: article title.
     *                                                  Second argument (optional): sentence limit.
     * @param CommandExecutionContext $executionContext Not used by this method; the cache location
     *                                                  comes from the context given to the constructor.
     *
     * @return string The extract prefixed with "> ".
     *
     * @throws ExecutionFailedException If the request fails, the response cannot be decoded,
     *                                  or no page with an extract is returned.
     */
    public function execute(CommandParams $params, CommandExecutionContext $executionContext): string
    {
        $article = $params->getFirstArgument();
        $numSentences = (int) $params->getSecondArgument(0);

        $cacheFile = $this->getCacheFilePath($article);
        if (is_readable($cacheFile)) {
            $summary = file_get_contents($cacheFile);

            // A failed read yields false, which quote() cannot accept under
            // strict types; fall through and fetch the article again instead.
            if ($summary !== false) {
                return $this->quote($summary, $numSentences);
            }
        }

        $url = $this->buildURL($article);
        $response = file_get_contents($url);

        // file_get_contents() returns false on failure; json_decode(false)
        // would raise a TypeError under strict types, so report it explicitly.
        if ($response === false) {
            throw new ExecutionFailedException("Failed to request Wikipedia article '$article'. Request URL: $url");
        }

        $data = json_decode($response);
        if (!$data) {
            throw new ExecutionFailedException('Wikipedia API response could not be decoded. Request URL: '.$url.'. Response: '.var_export($response, true));
        }

        // Error payloads carry no query/pages member; treat that as "no pages"
        // so the generic failure below is raised without PHP warnings.
        $pages = $data->query->pages ?? [];
        if (!is_array($pages) && !is_object($pages)) {
            $pages = [];
        }

        foreach ($pages as $page) {
            // Skip pages flagged as missing and pages that carry no usable extract.
            if (isset($page->missing) || !isset($page->extract) || !is_string($page->extract)) {
                continue;
            }

            // Caching is best effort: a failed write must not fail the command.
            file_put_contents($cacheFile, $page->extract);

            return $this->quote($page->extract, $numSentences);
        }

        throw new ExecutionFailedException("Failed to query for Wikipedia article '$article'. Request URL: $url");
    }

    /**
     * Builds the cache file path for an article; the title is hashed so that
     * any title maps to a fixed-length, filesystem-safe file name.
     */
    private function getCacheFilePath(string $article): string
    {
        $tmpDir = $this->executionContext->ensureTempDirectory();

        return $tmpDir.'/summary-'.md5($article).'.txt';
    }

    /**
     * Formats text as a Markdown block quote, optionally truncated to the
     * first $numSentences sentences (values <= 0 keep the full text).
     */
    private function quote(string $text, int $numSentences): string
    {
        if ($numSentences > 0) {
            $sentences = $this->sentenceBreaker->split($text);
            $text = implode(' ', array_slice($sentences, 0, $numSentences));
        }

        return "> $text";
    }

    /**
     * Builds the API request URL asking for the plain-text intro extract of $article.
     */
    private function buildURL(string $article): string
    {
        $params = [
            'format' => 'json',
            'action' => 'query',
            'prop' => 'extracts',
            'exintro' => '',
            'explaintext' => '',
            'titles' => $article,
        ];

        // The numeric prefix must be a string: passing null to this non-nullable
        // parameter raises a TypeError when strict_types is enabled.
        return self::ENDPOINT.'?'.http_build_query($params, '', '&', PHP_QUERY_RFC3986);
    }
}
92
|
|
|
|