@@ -68,7 +68,7 @@ |
||
| 68 | 68 | } |
| 69 | 69 | |
| 70 | 70 | /** |
| 71 | - * @param CrawlUrl|\Psr\Http\Message\UriInterface|string $crawlUrl |
|
| 71 | + * @param CrawlUrl $crawlUrl |
|
| 72 | 72 | * |
| 73 | 73 | * @return bool |
| 74 | 74 | */ |
@@ -2,8 +2,8 @@ |
||
| 2 | 2 | |
| 3 | 3 | namespace Spatie\Crawler\CrawlQueue; |
| 4 | 4 | |
| 5 | -use Spatie\Crawler\CrawlUrl; |
|
| 6 | 5 | use Illuminate\Support\Collection; |
| 6 | +use Spatie\Crawler\CrawlUrl; |
|
| 7 | 7 | use Spatie\Crawler\Exception\UrlNotFoundByIndex; |
| 8 | 8 | |
| 9 | 9 | class CollectionCrawlQueue implements CrawlQueue |
@@ -3,23 +3,23 @@ |
||
| 3 | 3 | namespace Spatie\Crawler; |
| 4 | 4 | |
| 5 | 5 | use Generator; |
| 6 | -use Tree\Node\Node; |
|
| 7 | -use GuzzleHttp\Pool; |
|
| 8 | 6 | use GuzzleHttp\Client; |
| 9 | -use GuzzleHttp\Psr7\Uri; |
|
| 7 | +use GuzzleHttp\Exception\RequestException; |
|
| 8 | +use GuzzleHttp\Pool; |
|
| 10 | 9 | use GuzzleHttp\Psr7\Request; |
| 11 | -use InvalidArgumentException; |
|
| 10 | +use GuzzleHttp\Psr7\Uri; |
|
| 12 | 11 | use GuzzleHttp\RequestOptions; |
| 13 | 12 | use Illuminate\Support\Collection; |
| 13 | +use InvalidArgumentException; |
|
| 14 | +use Psr\Http\Message\ResponseInterface; |
|
| 15 | +use Psr\Http\Message\StreamInterface; |
|
| 14 | 16 | use Psr\Http\Message\UriInterface; |
| 15 | 17 | use Spatie\Browsershot\Browsershot; |
| 16 | -use Psr\Http\Message\StreamInterface; |
|
| 17 | -use Symfony\Component\DomCrawler\Link; |
|
| 18 | -use Psr\Http\Message\ResponseInterface; |
|
| 19 | -use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
| 20 | -use GuzzleHttp\Exception\RequestException; |
|
| 21 | 18 | use Spatie\Crawler\CrawlQueue\CollectionCrawlQueue; |
| 19 | +use Spatie\Crawler\CrawlQueue\CrawlQueue; |
|
| 22 | 20 | use Symfony\Component\DomCrawler\Crawler as DomCrawler; |
| 21 | +use Symfony\Component\DomCrawler\Link; |
|
| 22 | +use Tree\Node\Node; |
|
| 23 | 23 | |
| 24 | 24 | class Crawler |
| 25 | 25 | { |
@@ -178,7 +178,7 @@ discard block |
||
| 178 | 178 | } |
| 179 | 179 | |
| 180 | 180 | /** |
| 181 | - * @param \Spatie\Crawler\CrawlObserver|array[\Spatie\Crawler\CrawlObserver] $crawlObserver |
|
| 181 | + * @param \Spatie\Crawler\CrawlObserver|\Spatie\Crawler\CrawlObserver[] $crawlObservers |
|
| 182 | 182 | * |
| 183 | 183 | * @return $this |
| 184 | 184 | */ |
@@ -291,6 +291,9 @@ discard block |
||
| 291 | 291 | strlen($haystack); |
| 292 | 292 | } |
| 293 | 293 | |
| 294 | + /** |
|
| 295 | + * @param int $readMaximumBytes |
|
| 296 | + */ |
|
| 294 | 297 | protected function convertBodyToString(StreamInterface $bodyStream, $readMaximumBytes = 1024 * 1024 * 2): string |
| 295 | 298 | { |
| 296 | 299 | $bodyStream->rewind(); |
@@ -404,6 +407,9 @@ discard block |
||
| 404 | 407 | return in_array($uri->getScheme(), ['http', 'https']); |
| 405 | 408 | } |
| 406 | 409 | |
| 410 | + /** |
|
| 411 | + * @return Node |
|
| 412 | + */ |
|
| 407 | 413 | protected function addtoDepthTree(Node $node, UriInterface $url, UriInterface $parentUrl) |
| 408 | 414 | { |
| 409 | 415 | $returnNode = null; |