@@ -68,7 +68,7 @@ |
||
68 | 68 | } |
69 | 69 | |
70 | 70 | /** |
71 | - * @param CrawlUrl|\Psr\Http\Message\UriInterface|string $crawlUrl |
|
71 | + * @param CrawlUrl $crawlUrl |
|
72 | 72 | * |
73 | 73 | * @return bool |
74 | 74 | */ |
@@ -3,8 +3,8 @@ |
||
3 | 3 | namespace Spatie\Crawler\CrawlQueue; |
4 | 4 | |
5 | 5 | use Spatie\Crawler\CrawlUrl; |
6 | -use Tightenco\Collect\Support\Collection; |
|
7 | 6 | use Spatie\Crawler\Exception\UrlNotFoundByIndex; |
7 | +use Tightenco\Collect\Support\Collection; |
|
8 | 8 | |
9 | 9 | class CollectionCrawlQueue implements CrawlQueue |
10 | 10 | { |
@@ -3,23 +3,23 @@ |
||
3 | 3 | namespace Spatie\Crawler; |
4 | 4 | |
5 | 5 | use Generator; |
6 | -use Tree\Node\Node; |
|
7 | -use GuzzleHttp\Pool; |
|
8 | 6 | use GuzzleHttp\Client; |
9 | -use GuzzleHttp\Psr7\Uri; |
|
7 | +use GuzzleHttp\Exception\RequestException; |
|
8 | +use GuzzleHttp\Pool; |
|
10 | 9 | use GuzzleHttp\Psr7\Request; |
11 | -use InvalidArgumentException; |
|
10 | +use GuzzleHttp\Psr7\Uri; |
|
12 | 11 | use GuzzleHttp\RequestOptions; |
12 | +use InvalidArgumentException; |
|
13 | +use Psr\Http\Message\ResponseInterface; |
|
14 | +use Psr\Http\Message\StreamInterface; |
|
13 | 15 | use Psr\Http\Message\UriInterface; |
14 | 16 | use Spatie\Browsershot\Browsershot; |
15 | -use Psr\Http\Message\StreamInterface; |
|
16 | -use Symfony\Component\DomCrawler\Link; |
|
17 | -use Psr\Http\Message\ResponseInterface; |
|
18 | -use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
19 | -use Tightenco\Collect\Support\Collection; |
|
20 | -use GuzzleHttp\Exception\RequestException; |
|
21 | 17 | use Spatie\Crawler\CrawlQueue\CollectionCrawlQueue; |
18 | +use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
22 | 19 | use Symfony\Component\DomCrawler\Crawler as DomCrawler; |
20 | +use Symfony\Component\DomCrawler\Link; |
|
21 | +use Tightenco\Collect\Support\Collection; |
|
22 | +use Tree\Node\Node; |
|
23 | 23 | |
24 | 24 | class Crawler |
25 | 25 | { |
@@ -292,6 +292,9 @@ discard block |
||
292 | 292 | strlen($haystack); |
293 | 293 | } |
294 | 294 | |
295 | + /** |
|
296 | + * @param int $readMaximumBytes |
|
297 | + */ |
|
295 | 298 | protected function convertBodyToString(StreamInterface $bodyStream, $readMaximumBytes = 1024 * 1024 * 2): string |
296 | 299 | { |
297 | 300 | $bodyStream->rewind(); |
@@ -302,7 +305,7 @@ discard block |
||
302 | 305 | } |
303 | 306 | |
304 | 307 | /** |
305 | - * @param ResponseInterface|null $response |
|
308 | + * @param ResponseInterface $response |
|
306 | 309 | * @param CrawlUrl $crawlUrl |
307 | 310 | */ |
308 | 311 | protected function handleCrawled(ResponseInterface $response, CrawlUrl $crawlUrl) |
@@ -429,6 +432,9 @@ discard block |
||
429 | 432 | return in_array($uri->getScheme(), ['http', 'https']); |
430 | 433 | } |
431 | 434 | |
435 | + /** |
|
436 | + * @return Node|null |
|
437 | + */ |
|
432 | 438 | protected function addtoDepthTree(Node $node, UriInterface $url, UriInterface $parentUrl) |
433 | 439 | { |
434 | 440 | $returnNode = null; |
@@ -2,9 +2,9 @@ |
||
2 | 2 | |
3 | 3 | namespace Spatie\Crawler; |
4 | 4 | |
5 | -use Psr\Http\Message\UriInterface; |
|
6 | -use Psr\Http\Message\ResponseInterface; |
|
7 | 5 | use GuzzleHttp\Exception\RequestException; |
6 | +use Psr\Http\Message\ResponseInterface; |
|
7 | +use Psr\Http\Message\UriInterface; |
|
8 | 8 | |
9 | 9 | abstract class CrawlObserver |
10 | 10 | { |