@@ -68,7 +68,7 @@ |
||
| 68 | 68 | } |
| 69 | 69 | |
| 70 | 70 | /** |
| 71 | - * @param CrawlUrl|\Psr\Http\Message\UriInterface|string $crawlUrl |
|
| 71 | + * @param CrawlUrl $crawlUrl |
|
| 72 | 72 | * |
| 73 | 73 | * @return bool |
| 74 | 74 | */ |
@@ -3,8 +3,8 @@ |
||
| 3 | 3 | namespace Spatie\Crawler\CrawlQueue; |
| 4 | 4 | |
| 5 | 5 | use Spatie\Crawler\CrawlUrl; |
| 6 | -use Tightenco\Collect\Support\Collection; |
|
| 7 | 6 | use Spatie\Crawler\Exception\UrlNotFoundByIndex; |
| 7 | +use Tightenco\Collect\Support\Collection; |
|
| 8 | 8 | |
| 9 | 9 | class CollectionCrawlQueue implements CrawlQueue |
| 10 | 10 | { |
@@ -3,23 +3,23 @@ |
||
| 3 | 3 | namespace Spatie\Crawler; |
| 4 | 4 | |
| 5 | 5 | use Generator; |
| 6 | -use Tree\Node\Node; |
|
| 7 | -use GuzzleHttp\Pool; |
|
| 8 | 6 | use GuzzleHttp\Client; |
| 9 | -use GuzzleHttp\Psr7\Uri; |
|
| 7 | +use GuzzleHttp\Exception\RequestException; |
|
| 8 | +use GuzzleHttp\Pool; |
|
| 10 | 9 | use GuzzleHttp\Psr7\Request; |
| 11 | -use InvalidArgumentException; |
|
| 10 | +use GuzzleHttp\Psr7\Uri; |
|
| 12 | 11 | use GuzzleHttp\RequestOptions; |
| 12 | +use InvalidArgumentException; |
|
| 13 | +use Psr\Http\Message\ResponseInterface; |
|
| 14 | +use Psr\Http\Message\StreamInterface; |
|
| 13 | 15 | use Psr\Http\Message\UriInterface; |
| 14 | 16 | use Spatie\Browsershot\Browsershot; |
| 15 | -use Psr\Http\Message\StreamInterface; |
|
| 16 | -use Symfony\Component\DomCrawler\Link; |
|
| 17 | -use Psr\Http\Message\ResponseInterface; |
|
| 18 | -use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
| 19 | -use Tightenco\Collect\Support\Collection; |
|
| 20 | -use GuzzleHttp\Exception\RequestException; |
|
| 21 | 17 | use Spatie\Crawler\CrawlQueue\CollectionCrawlQueue; |
| 18 | +use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
| 22 | 19 | use Symfony\Component\DomCrawler\Crawler as DomCrawler; |
| 20 | +use Symfony\Component\DomCrawler\Link; |
|
| 21 | +use Tightenco\Collect\Support\Collection; |
|
| 22 | +use Tree\Node\Node; |
|
| 23 | 23 | |
| 24 | 24 | class Crawler |
| 25 | 25 | { |
@@ -292,6 +292,9 @@ discard block |
||
| 292 | 292 | strlen($haystack); |
| 293 | 293 | } |
| 294 | 294 | |
| 295 | + /** |
|
| 296 | + * @param int $readMaximumBytes |
|
| 297 | + */ |
|
| 295 | 298 | protected function convertBodyToString(StreamInterface $bodyStream, $readMaximumBytes = 1024 * 1024 * 2): string |
| 296 | 299 | { |
| 297 | 300 | $bodyStream->rewind(); |
@@ -302,7 +305,7 @@ discard block |
||
| 302 | 305 | } |
| 303 | 306 | |
| 304 | 307 | /** |
| 305 | - * @param ResponseInterface|null $response |
|
| 308 | + * @param ResponseInterface $response |
|
| 306 | 309 | * @param CrawlUrl $crawlUrl |
| 307 | 310 | */ |
| 308 | 311 | protected function handleCrawled(ResponseInterface $response, CrawlUrl $crawlUrl) |
@@ -429,6 +432,9 @@ discard block |
||
| 429 | 432 | return in_array($uri->getScheme(), ['http', 'https']); |
| 430 | 433 | } |
| 431 | 434 | |
| 435 | + /** |
|
| 436 | + * @return Node |
|
| 437 | + */ |
|
| 432 | 438 | protected function addtoDepthTree(Node $node, UriInterface $url, UriInterface $parentUrl) |
| 433 | 439 | { |
| 434 | 440 | $returnNode = null; |
@@ -2,9 +2,9 @@ |
||
| 2 | 2 | |
| 3 | 3 | namespace Spatie\Crawler; |
| 4 | 4 | |
| 5 | -use Psr\Http\Message\UriInterface; |
|
| 6 | -use Psr\Http\Message\ResponseInterface; |
|
| 7 | 5 | use GuzzleHttp\Exception\RequestException; |
| 6 | +use Psr\Http\Message\ResponseInterface; |
|
| 7 | +use Psr\Http\Message\UriInterface; |
|
| 8 | 8 | |
| 9 | 9 | abstract class CrawlObserver |
| 10 | 10 | { |