@@ -66,7 +66,7 @@ discard block |
||
| 66 | 66 | $this->tableName, |
| 67 | 67 | $where, |
| 68 | 68 | '', |
| 69 | - htmlspecialchars($orderField) . ' ' . htmlspecialchars($orderDirection), |
|
| 69 | + htmlspecialchars($orderField).' '.htmlspecialchars($orderDirection), |
|
| 70 | 70 | self::getLimitFromItemCountAndOffset($itemCount, $offset) |
| 71 | 71 | ); |
| 72 | 72 | |
@@ -111,7 +111,7 @@ discard block |
||
| 111 | 111 | */ |
| 112 | 112 | public function countNotTimeouted($ttl) |
| 113 | 113 | { |
| 114 | - return $this->countByWhere('deleted = 0 AND ttl > ' . intval($ttl)); |
|
| 114 | + return $this->countByWhere('deleted = 0 AND ttl > '.intval($ttl)); |
|
| 115 | 115 | } |
| 116 | 116 | |
| 117 | 117 | /** |
@@ -127,7 +127,7 @@ discard block |
||
| 127 | 127 | { |
| 128 | 128 | $itemCount = filter_var($itemCount, FILTER_VALIDATE_INT, ['options' => ['min_range' => 1, 'default' => 20]]); |
| 129 | 129 | $offset = filter_var($offset, FILTER_VALIDATE_INT, ['options' => ['min_range' => 0, 'default' => 0]]); |
| 130 | - $limit = $offset . ', ' . $itemCount; |
|
| 130 | + $limit = $offset.', '.$itemCount; |
|
| 131 | 131 | |
| 132 | 132 | return $limit; |
| 133 | 133 | } |
@@ -47,7 +47,7 @@ |
||
| 47 | 47 | public function execute() |
| 48 | 48 | { |
| 49 | 49 | $processManager = new \tx_crawler_domain_process_manager(); |
| 50 | - $timeout = is_int($this->timeOut) ? (int)$this->timeOut : 1800; |
|
| 50 | + $timeout = is_int($this->timeOut) ? (int) $this->timeOut : 1800; |
|
| 51 | 51 | |
| 52 | 52 | try { |
| 53 | 53 | $processManager->multiProcess($timeout); |
@@ -12,12 +12,12 @@ discard block |
||
| 12 | 12 | if (!isAbsPath($tempPathThisScript)) { |
| 13 | 13 | $workingDirectory = $_SERVER['PWD'] ? $_SERVER['PWD'] : getcwd(); |
| 14 | 14 | if ($workingDirectory) { |
| 15 | - $tempPathThisScript = $workingDirectory . '/' . preg_replace('/\.\//', '', $tempPathThisScript); |
|
| 15 | + $tempPathThisScript = $workingDirectory.'/'.preg_replace('/\.\//', '', $tempPathThisScript); |
|
| 16 | 16 | if (!@is_file($tempPathThisScript)) { |
| 17 | - die('Relative path found, but an error occured during resolving of the absolute path: ' . $tempPathThisScript . PHP_EOL); |
|
| 17 | + die('Relative path found, but an error occured during resolving of the absolute path: '.$tempPathThisScript.PHP_EOL); |
|
| 18 | 18 | } |
| 19 | 19 | } else { |
| 20 | - die('Relative path found, but resolving absolute path is not supported on this platform.' . PHP_EOL); |
|
| 20 | + die('Relative path found, but resolving absolute path is not supported on this platform.'.PHP_EOL); |
|
| 21 | 21 | } |
| 22 | 22 | } |
| 23 | 23 | |
@@ -35,7 +35,7 @@ discard block |
||
| 35 | 35 | list($key, $value) = explode(':', $additionalHeader, 2); |
| 36 | 36 | $key = str_replace('-', '_', strtoupper(trim($key))); |
| 37 | 37 | if ($key != 'HOST') { |
| 38 | - $_SERVER['HTTP_' . $key] = $value; |
|
| 38 | + $_SERVER['HTTP_'.$key] = $value; |
|
| 39 | 39 | } |
| 40 | 40 | } |
| 41 | 41 | } |
@@ -57,18 +57,18 @@ discard block |
||
| 57 | 57 | $typo3SitePath = $_SERVER['argv'][1]; |
| 58 | 58 | |
| 59 | 59 | // faking the environment |
| 60 | -$_SERVER['DOCUMENT_ROOT'] = preg_replace('#' . preg_quote($typo3SitePath, '#') . '$#', '', $typo3Root); |
|
| 60 | +$_SERVER['DOCUMENT_ROOT'] = preg_replace('#'.preg_quote($typo3SitePath, '#').'$#', '', $typo3Root); |
|
| 61 | 61 | $_SERVER['HTTP_USER_AGENT'] = 'CLI Mode'; |
| 62 | 62 | $_SERVER['HTTP_HOST'] = $_SERVER['SERVER_NAME'] = $urlParts['host']; |
| 63 | -$_SERVER['SCRIPT_NAME'] = $_SERVER['PHP_SELF'] = $typo3SitePath . 'index.php'; |
|
| 64 | -$_SERVER['SCRIPT_FILENAME'] = $_SERVER['PATH_TRANSLATED'] = $typo3Root . 'index.php'; |
|
| 63 | +$_SERVER['SCRIPT_NAME'] = $_SERVER['PHP_SELF'] = $typo3SitePath.'index.php'; |
|
| 64 | +$_SERVER['SCRIPT_FILENAME'] = $_SERVER['PATH_TRANSLATED'] = $typo3Root.'index.php'; |
|
| 65 | 65 | $_SERVER['QUERY_STRING'] = (isset($urlParts['query']) ? $urlParts['query'] : ''); |
| 66 | -$_SERVER['REQUEST_URI'] = $urlParts['path'] . (isset($urlParts['query']) ? '?' . $urlParts['query'] : ''); |
|
| 66 | +$_SERVER['REQUEST_URI'] = $urlParts['path'].(isset($urlParts['query']) ? '?'.$urlParts['query'] : ''); |
|
| 67 | 67 | $_SERVER['REQUEST_METHOD'] = 'GET'; |
| 68 | 68 | |
| 69 | 69 | // Define a port if used in the URL: |
| 70 | 70 | if (isset($urlParts['port'])) { |
| 71 | - $_SERVER['HTTP_HOST'] .= ':' . $urlParts['port']; |
|
| 71 | + $_SERVER['HTTP_HOST'] .= ':'.$urlParts['port']; |
|
| 72 | 72 | $_SERVER['SERVER_PORT'] = $urlParts['port']; |
| 73 | 73 | } |
| 74 | 74 | |
@@ -78,7 +78,7 @@ discard block |
||
| 78 | 78 | } |
| 79 | 79 | |
| 80 | 80 | chdir($typo3Root); |
| 81 | -include($typo3Root . '/index.php'); |
|
| 81 | +include($typo3Root.'/index.php'); |
|
| 82 | 82 | |
| 83 | 83 | |
| 84 | 84 | /** |
@@ -59,7 +59,7 @@ discard block |
||
| 59 | 59 | $this->cli_options[] = ['-d depth', 'Tree depth, 0-99', "How many levels under the 'page_id' to include."]; |
| 60 | 60 | $this->cli_options[] = ['-o mode', 'Output mode: "url", "exec", "queue"', "Specifies output modes\nurl : Will list URLs which wget could use as input.\nqueue: Will put entries in queue table.\nexec: Will execute all entries right away!"]; |
| 61 | 61 | $this->cli_options[] = ['-n number', 'Number of items per minute.', 'Specifies how many items are put in the queue per minute. Only valid for output mode "queue"']; |
| 62 | - $this->cli_options[] = ['-conf configurationkeys','List of Configuration Keys','A commaseperated list of crawler configurations']; |
|
| 62 | + $this->cli_options[] = ['-conf configurationkeys', 'List of Configuration Keys', 'A commaseperated list of crawler configurations']; |
|
| 63 | 63 | # $this->cli_options[] = array('-v level', 'Verbosity level 0-3', "The value of level can be:\n 0 = all output\n 1 = info and greater (default)\n 2 = warnings and greater\n 3 = errors"); |
| 64 | 64 | |
| 65 | 65 | // Setting help texts: |
@@ -67,7 +67,7 @@ discard block |
||
| 67 | 67 | $this->cli_help['synopsis'] = 'page_id ###OPTIONS###'; |
| 68 | 68 | $this->cli_help['description'] = "Works as a CLI interface to some functionality from the Web > Info > Site Crawler module; It can put entries in the queue from command line options, return the list of URLs and even execute all entries right away without having to queue them up - this can be useful for immediate re-cache, re-indexing or static publishing from command line."; |
| 69 | 69 | $this->cli_help['examples'] = "/.../cli_dispatch.phpsh crawler_im 7 -d=2 -conf=<configurationKey> -o=exec\nWill re-cache pages from page 7 and two levels down, executed immediately.\n"; |
| 70 | - $this->cli_help['examples'].= "/.../cli_dispatch.phpsh crawler_im 7 -d=0 -conf=<configurationKey> -n=4 -o=queue\nWill put entries for re-caching pages from page 7 into queue, 4 every minute.\n"; |
|
| 70 | + $this->cli_help['examples'] .= "/.../cli_dispatch.phpsh crawler_im 7 -d=0 -conf=<configurationKey> -n=4 -o=queue\nWill put entries for re-caching pages from page 7 into queue, 4 every minute.\n"; |
|
| 71 | 71 | $this->cli_help['author'] = 'Kasper Skaarhoj, Daniel Poetzinger, Fabrizio Branca, Tolleiv Nietsch, Timo Schmidt - AOE media 2009'; |
| 72 | 72 | } |
| 73 | 73 | } |
@@ -9,5 +9,5 @@ |
||
| 9 | 9 | try { |
| 10 | 10 | $processManager->multiProcess($timeout); |
| 11 | 11 | } catch (Exception $e) { |
| 12 | - echo PHP_EOL . $e->getMessage(); |
|
| 12 | + echo PHP_EOL.$e->getMessage(); |
|
| 13 | 13 | } |
@@ -53,16 +53,16 @@ |
||
| 53 | 53 | </thead> |
| 54 | 54 | <tbody> |
| 55 | 55 | <?php foreach ($this->getProcessCollection() as $process): /* @var $process tx_crawler_domain_process */ ?> |
| 56 | - <tr class="<?php echo (++$count % 2 == 0) ? 'odd': 'even' ?>"> |
|
| 56 | + <tr class="<?php echo (++$count % 2 == 0) ? 'odd' : 'even' ?>"> |
|
| 57 | 57 | <td><?php echo $this->getIconForState(htmlspecialchars($process->getState())); ?></td> |
| 58 | 58 | <td><?php echo htmlspecialchars($process->getProcess_id()); ?></td> |
| 59 | 59 | <td><?php echo htmlspecialchars($this->asDate($process->getTimeForFirstItem())); ?></td> |
| 60 | 60 | <td><?php echo htmlspecialchars($this->asDate($process->getTimeForLastItem())); ?></td> |
| 61 | - <td><?php echo htmlspecialchars(floor($process->getRuntime()/ 60)); ?> min. <?php echo htmlspecialchars($process->getRuntime()) % 60 ?> sec.</td> |
|
| 61 | + <td><?php echo htmlspecialchars(floor($process->getRuntime() / 60)); ?> min. <?php echo htmlspecialchars($process->getRuntime()) % 60 ?> sec.</td> |
|
| 62 | 62 | <td><?php echo htmlspecialchars($this->asDate($process->getTTL())); ?></td> |
| 63 | 63 | <td><?php echo htmlspecialchars($process->countItemsProcessed()); ?></td> |
| 64 | 64 | <td><?php echo htmlspecialchars($process->countItemsAssigned()); ?></td> |
| 65 | - <td><?php echo htmlspecialchars($process->countItemsToProcess()+$process->countItemsProcessed()); ?></td> |
|
| 65 | + <td><?php echo htmlspecialchars($process->countItemsToProcess() + $process->countItemsProcessed()); ?></td> |
|
| 66 | 66 | <td> |
| 67 | 67 | <?php if ($process->getState() == 'running'): ?> |
| 68 | 68 | <div class="crawlerprocessprogress" style="width: 200px;"> |
@@ -3,12 +3,12 @@ |
||
| 3 | 3 | } ?> |
| 4 | 4 | |
| 5 | 5 | Page: |
| 6 | -<?php for ($currentPageOffset = 0; $currentPageOffset < $this->getTotalPagesCount(); $currentPageOffset++) { |
|
| 6 | +<?php for ($currentPageOffset = 0; $currentPageOffset < $this->getTotalPagesCount(); $currentPageOffset++) { |
|
| 7 | 7 | ?> |
| 8 | 8 | <a href="index.php?offset=<?php echo htmlspecialchars($currentPageOffset * $this->getPerPage()); ?>"> |
| 9 | 9 | <?php echo htmlspecialchars($this->getLabelForPageOffset($currentPageOffset)); ?> |
| 10 | 10 | </a> |
| 11 | - <?php if ($currentPageOffset+1 < $this->getTotalPagesCount()) { |
|
| 11 | + <?php if ($currentPageOffset + 1 < $this->getTotalPagesCount()) { |
|
| 12 | 12 | ?> |
| 13 | 13 | | |
| 14 | 14 | <?php |
@@ -50,8 +50,8 @@ discard block |
||
| 50 | 50 | */ |
| 51 | 51 | public function offsetGet($index) |
| 52 | 52 | { |
| 53 | - if (! parent::offsetExists($index)) { |
|
| 54 | - throw new Exception('Index "' . var_export($index, true) . '" for tx_crawler_domain_process are not available'); |
|
| 53 | + if (!parent::offsetExists($index)) { |
|
| 54 | + throw new Exception('Index "'.var_export($index, true).'" for tx_crawler_domain_process are not available'); |
|
| 55 | 55 | } |
| 56 | 56 | return parent::offsetGet($index); |
| 57 | 57 | } |
@@ -66,7 +66,7 @@ discard block |
||
| 66 | 66 | */ |
| 67 | 67 | public function offsetSet($index, $subject) |
| 68 | 68 | { |
| 69 | - if (! $subject instanceof tx_crawler_domain_process) { |
|
| 69 | + if (!$subject instanceof tx_crawler_domain_process) { |
|
| 70 | 70 | throw new InvalidArgumentException('Wrong parameter type given, "tx_crawler_domain_process" expected!'); |
| 71 | 71 | } |
| 72 | 72 | parent::offsetSet($index, $subject); |
@@ -80,7 +80,7 @@ discard block |
||
| 80 | 80 | */ |
| 81 | 81 | public function append($subject) |
| 82 | 82 | { |
| 83 | - if (! $subject instanceof tx_crawler_domain_process) { |
|
| 83 | + if (!$subject instanceof tx_crawler_domain_process) { |
|
| 84 | 84 | throw new InvalidArgumentException('Wrong parameter type given, "tx_crawler_domain_process" expected!'); |
| 85 | 85 | } |
| 86 | 86 | parent::append($subject); |
@@ -92,9 +92,9 @@ discard block |
||
| 92 | 92 | */ |
| 93 | 93 | public function getProcessIds() |
| 94 | 94 | { |
| 95 | - $result=[]; |
|
| 95 | + $result = []; |
|
| 96 | 96 | foreach ($this->getIterator() as $value) { |
| 97 | - $result[]=$value->getProcess_id(); |
|
| 97 | + $result[] = $value->getProcess_id(); |
|
| 98 | 98 | } |
| 99 | 99 | return $result; |
| 100 | 100 | } |
@@ -67,8 +67,8 @@ discard block |
||
| 67 | 67 | */ |
| 68 | 68 | public function __construct() |
| 69 | 69 | { |
| 70 | - $this->processRepository = new tx_crawler_domain_process_repository(); |
|
| 71 | - $this->queueRepository = new tx_crawler_domain_queue_repository(); |
|
| 70 | + $this->processRepository = new tx_crawler_domain_process_repository(); |
|
| 71 | + $this->queueRepository = new tx_crawler_domain_queue_repository(); |
|
| 72 | 72 | $this->crawlerObj = \TYPO3\CMS\Core\Utility\GeneralUtility::makeInstance('tx_crawler_lib'); |
| 73 | 73 | $this->timeToLive = intval($this->crawlerObj->extensionSettings['processMaxRunTime']); |
| 74 | 74 | $this->countInARun = intval($this->crawlerObj->extensionSettings['countInARun']); |
@@ -84,7 +84,7 @@ discard block |
||
| 84 | 84 | public function multiProcess($timeout) |
| 85 | 85 | { |
| 86 | 86 | if ($this->processLimit <= 1) { |
| 87 | - throw new RuntimeException('To run crawler in multi process mode you have to configure the processLimit > 1.' . PHP_EOL); |
|
| 87 | + throw new RuntimeException('To run crawler in multi process mode you have to configure the processLimit > 1.'.PHP_EOL); |
|
| 88 | 88 | } |
| 89 | 89 | |
| 90 | 90 | $pendingItemsStart = $this->queueRepository->countAllPendingItems(); |
@@ -102,7 +102,7 @@ discard block |
||
| 102 | 102 | } |
| 103 | 103 | if ($currentPendingItems == 0) { |
| 104 | 104 | if ($this->verbose) { |
| 105 | - echo 'Finished...' . chr(10); |
|
| 105 | + echo 'Finished...'.chr(10); |
|
| 106 | 106 | } |
| 107 | 107 | break; |
| 108 | 108 | } |
@@ -114,16 +114,16 @@ discard block |
||
| 114 | 114 | } |
| 115 | 115 | sleep(1); |
| 116 | 116 | if ($nextTimeOut < time()) { |
| 117 | - $timedOutProcesses = $this->processRepository->findAll('', 'DESC', null, 0, 'ttl >' . $nextTimeOut); |
|
| 117 | + $timedOutProcesses = $this->processRepository->findAll('', 'DESC', null, 0, 'ttl >'.$nextTimeOut); |
|
| 118 | 118 | $nextTimeOut = time() + $this->timeToLive; |
| 119 | 119 | if ($this->verbose) { |
| 120 | - echo 'Cleanup' . implode(',', $timedOutProcesses->getProcessIds()) . chr(10); |
|
| 120 | + echo 'Cleanup'.implode(',', $timedOutProcesses->getProcessIds()).chr(10); |
|
| 121 | 121 | } |
| 122 | 122 | $this->crawlerObj->CLI_releaseProcesses($timedOutProcesses->getProcessIds(), true); |
| 123 | 123 | } |
| 124 | 124 | } |
| 125 | 125 | if ($currentPendingItems > 0 && $this->verbose) { |
| 126 | - echo 'Stop with timeout' . chr(10); |
|
| 126 | + echo 'Stop with timeout'.chr(10); |
|
| 127 | 127 | } |
| 128 | 128 | } |
| 129 | 129 | |
@@ -143,17 +143,17 @@ discard block |
||
| 143 | 143 | private function startRequiredProcesses() |
| 144 | 144 | { |
| 145 | 145 | $ret = false; |
| 146 | - $currentProcesses= $this->processRepository->countActive(); |
|
| 147 | - $availableProcessesCount = $this->processLimit-$currentProcesses; |
|
| 146 | + $currentProcesses = $this->processRepository->countActive(); |
|
| 147 | + $availableProcessesCount = $this->processLimit - $currentProcesses; |
|
| 148 | 148 | $requiredProcessesCount = ceil($this->queueRepository->countAllUnassignedPendingItems() / $this->countInARun); |
| 149 | - $startProcessCount = min([$availableProcessesCount,$requiredProcessesCount]); |
|
| 149 | + $startProcessCount = min([$availableProcessesCount, $requiredProcessesCount]); |
|
| 150 | 150 | if ($startProcessCount <= 0) { |
| 151 | 151 | return $ret; |
| 152 | 152 | } |
| 153 | 153 | if ($startProcessCount && $this->verbose) { |
| 154 | 154 | echo 'Start '.$startProcessCount.' new processes (Running:'.$currentProcesses.')'; |
| 155 | 155 | } |
| 156 | - for ($i=0;$i<$startProcessCount;$i++) { |
|
| 156 | + for ($i = 0; $i < $startProcessCount; $i++) { |
|
| 157 | 157 | usleep(100); |
| 158 | 158 | if ($this->startProcess()) { |
| 159 | 159 | if ($this->verbose) { |
@@ -174,13 +174,13 @@ discard block |
||
| 174 | 174 | */ |
| 175 | 175 | public function startProcess() |
| 176 | 176 | { |
| 177 | - $ttl = (time() + $this->timeToLive -1); |
|
| 177 | + $ttl = (time() + $this->timeToLive - 1); |
|
| 178 | 178 | $current = $this->processRepository->countNotTimeouted($ttl); |
| 179 | - $completePath = '(' .escapeshellcmd($this->getCrawlerCliPath()) . ' &) > /dev/null'; |
|
| 179 | + $completePath = '('.escapeshellcmd($this->getCrawlerCliPath()).' &) > /dev/null'; |
|
| 180 | 180 | if (system($completePath) === false) { |
| 181 | 181 | throw new Exception('could not start process!'); |
| 182 | 182 | } else { |
| 183 | - for ($i=0;$i<10;$i++) { |
|
| 183 | + for ($i = 0; $i < 10; $i++) { |
|
| 184 | 184 | if ($this->processRepository->countNotTimeouted($ttl) > $current) { |
| 185 | 185 | return true; |
| 186 | 186 | } |
@@ -197,9 +197,9 @@ discard block |
||
| 197 | 197 | */ |
| 198 | 198 | public function getCrawlerCliPath() |
| 199 | 199 | { |
| 200 | - $phpPath = $this->crawlerObj->extensionSettings['phpPath'] . ' '; |
|
| 201 | - $pathToTypo3 = rtrim(\TYPO3\CMS\Core\Utility\GeneralUtility::getIndpEnv('TYPO3_DOCUMENT_ROOT'), '/'); |
|
| 202 | - $pathToTypo3 .= rtrim(\TYPO3\CMS\Core\Utility\GeneralUtility::getIndpEnv('TYPO3_SITE_PATH'), '/'); |
|
| 200 | + $phpPath = $this->crawlerObj->extensionSettings['phpPath'].' '; |
|
| 201 | + $pathToTypo3 = rtrim(\TYPO3\CMS\Core\Utility\GeneralUtility::getIndpEnv('TYPO3_DOCUMENT_ROOT'), '/'); |
|
| 202 | + $pathToTypo3 .= rtrim(\TYPO3\CMS\Core\Utility\GeneralUtility::getIndpEnv('TYPO3_SITE_PATH'), '/'); |
|
| 203 | 203 | $cliPart = '/typo3/cli_dispatch.phpsh crawler'; |
| 204 | 204 | return $phpPath.$pathToTypo3.$cliPart; |
| 205 | 205 | } |