Passed
Push — master ( b27fbc...b83806 )
by Aimeos
03:33
created

Standard::run()   B

Complexity

Conditions 6
Paths 14

Size

Total Lines 43
Code Lines 23

Duplication

Lines 0
Ratio 0 %

Importance

Changes 1
Bugs 0 Features 0
Metric Value
cc 6
eloc 23
c 1
b 0
f 0
nc 14
nop 0
dl 0
loc 43
rs 8.9297
1
<?php
2
3
/**
4
 * @license LGPLv3, http://opensource.org/licenses/LGPL-3.0
5
 * @copyright Aimeos (aimeos.org), 2019-2022
6
 * @package Controller
7
 * @subpackage Jobs
8
 */
9
10
11
namespace Aimeos\Controller\Jobs\Catalog\Import\Xml;
12
13
14
/**
15
 * Job controller for XML catalog imports
16
 *
17
 * @package Controller
18
 * @subpackage Jobs
19
 */
20
class Standard
21
	extends \Aimeos\Controller\Jobs\Base
22
	implements \Aimeos\Controller\Jobs\Iface
23
{
24
	/** controller/jobs/catalog/import/xml/name
25
	 * Class name of the used catalog import XML job controller implementation
26
	 *
27
	 * Each default job controller can be replaced by an alternative implementation.
28
	 * To use this implementation, you have to set the last part of the class
29
	 * name as configuration value so the controller factory knows which class it
30
	 * has to instantiate.
31
	 *
32
	 * For example, if the name of the default class is
33
	 *
34
	 *  \Aimeos\Controller\Jobs\Catalog\Import\Xml\Standard
35
	 *
36
	 * and you want to replace it with your own version named
37
	 *
38
	 *  \Aimeos\Controller\Jobs\Catalog\Import\Xml\Myxml
39
	 *
40
	 * then you have to set this configuration option:
41
	 *
42
	 *  controller/jobs/catalog/import/xml/name = Myxml
43
	 *
44
	 * The value is the last part of your own class name and it's case sensitive,
45
	 * so take care that the configuration value is exactly named like the last
46
	 * part of the class name.
47
	 *
48
	 * The allowed characters of the class name are A-Z, a-z and 0-9. No other
49
	 * characters are possible! You should always start the last part of the class
50
	 * name with an upper case character and continue only with lower case characters
51
	 * or numbers. Avoid camel case names like "MyXml"!
52
	 *
53
	 * @param string Last part of the class name
54
	 * @since 2019.04
55
	 */
56
57
	/** controller/jobs/catalog/import/xml/decorators/excludes
58
	 * Excludes decorators added by the "common" option from the catalog import XML job controller
59
	 *
60
	 * Decorators extend the functionality of a class by adding new aspects
61
	 * (e.g. log what is currently done), executing the methods of the underlying
62
	 * class only in certain conditions (e.g. only for logged in users) or
63
	 * modify what is returned to the caller.
64
	 *
65
	 * This option allows you to remove a decorator added via
66
	 * "controller/jobs/common/decorators/default" before they are wrapped
67
	 * around the job controller.
68
	 *
69
	 *  controller/jobs/catalog/import/xml/decorators/excludes = array( 'decorator1' )
70
	 *
71
	 * This would remove the decorator named "decorator1" from the list of
72
	 * common decorators ("\Aimeos\Controller\Jobs\Common\Decorator\*") added via
73
	 * "controller/jobs/common/decorators/default" to the job controller.
74
	 *
75
	 * @param array List of decorator names
76
	 * @since 2019.04
77
	 * @see controller/jobs/common/decorators/default
78
	 * @see controller/jobs/catalog/import/xml/decorators/global
79
	 * @see controller/jobs/catalog/import/xml/decorators/local
80
	 */
81
82
	/** controller/jobs/catalog/import/xml/decorators/global
83
	 * Adds a list of globally available decorators only to the catalog import XML job controller
84
	 *
85
	 * Decorators extend the functionality of a class by adding new aspects
86
	 * (e.g. log what is currently done), executing the methods of the underlying
87
	 * class only in certain conditions (e.g. only for logged in users) or
88
	 * modify what is returned to the caller.
89
	 *
90
	 * This option allows you to wrap global decorators
91
	 * ("\Aimeos\Controller\Jobs\Common\Decorator\*") around the job controller.
92
	 *
93
	 *  controller/jobs/catalog/import/xml/decorators/global = array( 'decorator1' )
94
	 *
95
	 * This would add the decorator named "decorator1" defined by
96
	 * "\Aimeos\Controller\Jobs\Common\Decorator\Decorator1" only to the job controller.
97
	 *
98
	 * @param array List of decorator names
99
	 * @since 2019.04
100
	 * @see controller/jobs/common/decorators/default
101
	 * @see controller/jobs/catalog/import/xml/decorators/excludes
102
	 * @see controller/jobs/catalog/import/xml/decorators/local
103
	 */
104
105
	/** controller/jobs/catalog/import/xml/decorators/local
106
	 * Adds a list of local decorators only to the catalog import XML job controller
107
	 *
108
	 * Decorators extend the functionality of a class by adding new aspects
109
	 * (e.g. log what is currently done), executing the methods of the underlying
110
	 * class only in certain conditions (e.g. only for logged in users) or
111
	 * modify what is returned to the caller.
112
	 *
113
	 * This option allows you to wrap local decorators
114
	 * ("\Aimeos\Controller\Jobs\Catalog\Import\Xml\Decorator\*") around the job
115
	 * controller.
116
	 *
117
	 *  controller/jobs/catalog/import/xml/decorators/local = array( 'decorator2' )
118
	 *
119
	 * This would add the decorator named "decorator2" defined by
120
	 * "\Aimeos\Controller\Jobs\Catalog\Import\Xml\Decorator\Decorator2"
121
	 * only to the job controller.
122
	 *
123
	 * @param array List of decorator names
124
	 * @since 2019.04
125
	 * @see controller/jobs/common/decorators/default
126
	 * @see controller/jobs/catalog/import/xml/decorators/excludes
127
	 * @see controller/jobs/catalog/import/xml/decorators/global
128
	 */
129
130
131
	use \Aimeos\Controller\Common\Common\Import\Traits;
132
	use \Aimeos\Controller\Common\Common\Import\Xml\Traits;
133
134
135
	/**
	 * Provides the translated name of this job.
	 *
	 * The text is looked up in the "controller/jobs" translation domain.
	 *
	 * @return string Localized name of the job
	 */
	public function getName() : string
	{
		$context = $this->context();

		return $context->translate( 'controller/jobs', 'Catalog import XML' );
	}
144
145
146
	/**
	 * Provides the translated description of this job.
	 *
	 * The text is looked up in the "controller/jobs" translation domain.
	 *
	 * @return string Localized description of the job
	 */
	public function getDescription() : string
	{
		$context = $this->context();

		return $context->translate( 'controller/jobs', 'Imports new and updates existing categories from XML files' );
	}
155
156
157
	/**
	 * Executes the job.
	 *
	 * Scans the configured location in the "fs-import" file system and passes
	 * every entry that isn't a directory, in sorted order, to the process object
	 * which calls import() for it. If the location is no directory, the method
	 * returns without doing anything.
	 *
	 * @throws \Exception Any error raised during the import, rethrown after it was logged and passed to mail()
	 */
	public function run()
	{
		$context = $this->context();
		$logger = $context->logger();
		$process = $context->process();

		$location = $this->location();
		$fs = $context->fs( 'fs-import' );

		if( $fs->isDir( $location ) === false ) {
			return;
		}

		try
		{
			$logger->info( sprintf( 'Started catalog import from "%1$s"', $location ), 'import/xml/catalog' );

			$fcn = function( \Aimeos\MShop\ContextIface $context, string $path ) {
				$this->import( $context, $path );
			};

			foreach( map( $fs->scan( $location ) )->sort() as $filename )
			{
				$path = $location . '/' . $filename;

				// sub-directories are not imported
				if( $fs instanceof \Aimeos\Base\Filesystem\DirIface && $fs->isDir( $path ) ) {
					continue;
				}

				// import() receives the value returned by readf() as file name
				// NOTE(review): presumably the path of a local copy of the file - confirm
				$process->start( $fcn, [$context, $fs->readf( $path )] );
			}

			// $process is the object returned by $context->process(), so a single
			// wait() call is sufficient (presumably blocks until the started tasks finished)
			$process->wait();

			$logger->info( sprintf( 'Finished catalog import from "%1$s"', $location ), 'import/xml/catalog' );
		}
		catch( \Exception $e )
		{
			$logger->error( 'Catalog import error: ' . $e->getMessage() . "\n" . $e->getTraceAsString(), 'import/xml/catalog' );
			$this->mail( 'Catalog XML import error', $e->getMessage() . "\n" . $e->getTraceAsString() );
			throw $e;
		}
	}
207
208
209
	/**
	 * Returns the configured backup name for imported files
	 *
	 * @return string Backup name read from the configuration, empty string if none is configured
	 */
	protected function backup() : string
	{
		/** controller/jobs/catalog/import/xml/backup
		 * Name of the backup for successfully imported files
		 *
		 * After a XML file was imported successfully, you can move it to another
		 * location, so it won't be imported again and isn't overwritten by the
		 * next file that is stored at the same location in the file system.
		 *
		 * You should use an absolute path to be sure but can be relative path
		 * if you absolutely know from where the job will be executed from. The
		 * name of the new backup location can contain placeholders understood
		 * by the PHP DateTime::format() method (with percent signs prefix) to
		 * create dynamic paths, e.g. "backup/%Y-%m-%d" which would create
		 * "backup/2000-01-01". For more information about the date() placeholders,
		 * please have a look into the PHP documentation of the
		 * {@link https://www.php.net/manual/en/datetime.format.php format() method}.
		 *
		 * **Note:** If no backup name is configured, the file or directory
		 * won't be moved away. Please make also sure that the parent directory
		 * and the new directory are writable so the file or directory could be
		 * moved.
		 *
		 * @param string Name of the backup file, optionally with date/time placeholders
		 * @since 2019.04
		 * @see controller/jobs/catalog/import/xml/domains
		 * @see controller/jobs/catalog/import/xml/location
		 * @see controller/jobs/catalog/import/xml/max-query
		 */
		$config = $this->context()->config();

		return (string) $config->get( 'controller/jobs/catalog/import/xml/backup' );
	}
245
246
247
	/**
	 * Returns the domain names whose items are fetched together with the catalog items
	 *
	 * @return array List of domain names, "media" and "text" if nothing is configured
	 */
	protected function domains() : array
	{
		/** controller/jobs/catalog/import/xml/domains
		 * List of item domain names that should be retrieved along with the catalog items
		 *
		 * For efficient processing, the items associated to the categories can be
		 * fetched too, minimizing the number of database queries required. To be
		 * most effective, the list of item domain names should be used in the
		 * mapping configuration too, so the retrieved items will be used during
		 * the import.
		 *
		 * @param array Associative list of MShop item domain names
		 * @since 2019.04
		 * @see controller/jobs/catalog/import/xml/backup
		 * @see controller/jobs/catalog/import/xml/location
		 * @see controller/jobs/catalog/import/xml/max-query
		 */
		$default = ['media', 'text'];
		$config = $this->context()->config();

		return $config->get( 'controller/jobs/catalog/import/xml/domains', $default );
	}
271
272
273
	/**
	 * Imports the XML file given by its path
	 *
	 * Reads the categories from the file, saves the types and lets all
	 * processors finish their work. Afterwards the file is moved to the
	 * configured backup name or, if no backup name is configured, deleted.
	 *
	 * @param \Aimeos\MShop\ContextIface $context Context object
	 * @param string $filename Absolute or relative path to the XML file
	 * @throws \Aimeos\Controller\Jobs\Exception If the file can't be opened or moved to the backup location
	 */
	protected function import( \Aimeos\MShop\ContextIface $context, string $filename )
	{
		$logger = $context->logger();
		$xml = new \XMLReader();

		if( $xml->open( $filename, LIBXML_COMPACT | LIBXML_PARSEHUGE ) === false ) {
			throw new \Aimeos\Controller\Jobs\Exception( sprintf( 'No XML file "%1$s" found', $filename ) );
		}

		$logger->info( sprintf( 'Started catalog import from file "%1$s"', $filename ), 'import/xml/catalog' );

		try
		{
			$this->importTree( $xml, $this->domains() );
		}
		finally
		{
			// release the file handle before the file is deleted or moved
			$xml->close();
		}

		$this->saveTypes();

		foreach( $this->getProcessors() as $proc ) {
			$proc->finish();
		}

		$logger->info( sprintf( 'Finished catalog import from file "%1$s"', $filename ), 'import/xml/catalog' );

		if( empty( $backup = $this->backup() ) )
		{
			// no backup configured: the imported file is removed
			unlink( $filename );
			return;
		}

		// the file must still exist when it's moved, so it's not deleted beforehand
		$backup = \Aimeos\Base\Str::strtime( $backup );

		if( @rename( $filename, $backup ) === false )
		{
			$msg = sprintf( 'Unable to move imported file "%1$s" to "%2$s"', $filename, $backup );
			throw new \Aimeos\Controller\Jobs\Exception( $msg );
		}
	}
307
308
309
	/**
	 * Imports a single category node
	 *
	 * If the node has a "ref" attribute and a category with that code exists,
	 * the category is moved below the given parent, updated from the node and
	 * saved. Otherwise, a new category is created and inserted below the parent.
	 *
	 * @param \DomElement $node DOM node of "catalogitem" element
	 * @param string[] $domains List of domain names whose referenced items will be updated in the catalog items
	 * @param string|null $parentid ID of the parent catalog node
	 * @param array &$map Receives the code/ID pairs of the child categories if an existing category was updated
	 * @return string Catalog ID of the imported category
	 */
	protected function importNode( \DomElement $node, array $domains, ?string $parentid, array &$map ) : string
	{
		$manager = \Aimeos\MShop::create( $this->context(), 'catalog' );

		if( $node->hasAttribute( 'ref' ) )
		{
			try
			{
				$item = $manager->find( $node->getAttribute( 'ref' ), $domains );
				$manager->move( $item->getId(), $item->getParentId(), $parentid );

				$item = $this->process( $item, $node );
				$currentid = $manager->save( $item )->getId();
				unset( $item );

				// only the direct children are needed for the code/ID map
				$tree = $manager->getTree( $currentid, [], \Aimeos\MW\Tree\Manager\Base::LEVEL_LIST );

				foreach( $tree->getChildren() as $child ) {
					$map[$child->getCode()] = $child->getId();
				}

				return $currentid;
			}
			// NOTE(review): this also covers move() and save(), so an \Aimeos\MShop\Exception
			// thrown by them leads to creating a new node as well - confirm that's intended
			catch( \Aimeos\MShop\Exception $e ) {} // not found, create new
		}

		$item = $this->process( $manager->create(), $node );
		return $manager->insert( $item, $parentid )->getId();
	}
347
348
349
	/**
	 * Imports the catalog document
	 *
	 * Reads the document node by node: each "catalogitem" element is imported
	 * below the given parent, each nested "catalog" element is imported
	 * recursively below the category imported last. When the end of the
	 * "catalog" element is reached, the categories remaining in the map (those
	 * not referenced by a "ref" attribute at this level) are deleted.
	 *
	 * @param \XMLReader $xml Catalog document to import
	 * @param string[] $domains List of domain names whose referenced items will be updated in the catalog items
	 * @param string|null $parentid ID of the parent catalog node
	 * @param array $map Associative list of catalog code as keys and category ID as values
	 * @throws \Aimeos\Controller\Jobs\Exception If a "catalogitem" node can't be expanded
	 */
	protected function importTree( \XMLReader $xml, array $domains, ?string $parentid = null, array $map = [] )
	{
		$childMap = [];
		$currentid = $parentid;

		while( $xml->read() === true )
		{
			if( $xml->nodeType === \XMLReader::ELEMENT && $xml->name === 'catalogitem' )
			{
				if( ( $node = $xml->expand() ) === false )
				{
					$msg = sprintf( 'Expanding "%1$s" node failed', 'catalogitem' );
					throw new \Aimeos\Controller\Jobs\Exception( $msg );
				}

				// referenced categories are still in use and must not be deleted
				if( ( $attr = $node->attributes->getNamedItem( 'ref' ) ) !== null ) {
					unset( $map[$attr->nodeValue] );
				}

				$currentid = $this->importNode( $node, $domains, $parentid, $childMap );
			}
			elseif( $xml->nodeType === \XMLReader::ELEMENT && $xml->name === 'catalog' )
			{
				if( $xml->isEmptyElement )
				{
					// "<catalog/>" has no end element the recursive call could stop at,
					// so it's handled like an empty "<catalog></catalog>" right here
					\Aimeos\MShop::create( $this->context(), 'catalog' )->delete( $childMap );
				}
				else
				{
					$this->importTree( $xml, $domains, $currentid, $childMap );
				}

				$childMap = [];
			}
			elseif( $xml->nodeType === \XMLReader::END_ELEMENT && $xml->name === 'catalog' )
			{
				\Aimeos\MShop::create( $this->context(), 'catalog' )->delete( $map );
				break;
			}
		}
	}
392
393
394
	/**
	 * Returns the configured location of the XML files to import
	 *
	 * @return string Configured path, "catalog" if nothing is configured
	 */
	protected function location() : string
	{
		/** controller/jobs/catalog/import/xml/location
		 * File or directory where the content is stored which should be imported
		 *
		 * You need to configure the XML file or directory with the XML files that
		 * should be imported. It should be an absolute path to be sure but can be
		 * relative path if you absolutely know from where the job will be executed
		 * from.
		 *
		 * @param string Relative path to the XML files
		 * @since 2019.04
		 * @see controller/jobs/catalog/import/xml/backup
		 * @see controller/jobs/catalog/import/xml/domains
		 * @see controller/jobs/catalog/import/xml/max-query
		 */
		$config = $this->context()->config();
		$path = $config->get( 'controller/jobs/catalog/import/xml/location', 'catalog' );

		return (string) $path;
	}
417
418
419
	/**
	 * Updates the catalog item and its referenced items using the given DOM node
	 *
	 * The attributes and child elements of the node are collected as key/value
	 * pairs and applied to the item, "lists" elements are handed over to the
	 * processor of the same name. Errors are logged and don't abort the import,
	 * the item is returned in the state it had when the error occurred.
	 *
	 * @param \Aimeos\MShop\Catalog\Item\Iface $item Catalog item object to update
	 * @param \DomElement $node DOM node used for updating the catalog item
	 * @return \Aimeos\MShop\Catalog\Item\Iface $item Updated catalog item object
	 */
	protected function process( \Aimeos\MShop\Catalog\Item\Iface $item, \DomElement $node ) : \Aimeos\MShop\Catalog\Item\Iface
	{
		try
		{
			$data = [];

			foreach( $node->attributes as $attribute ) {
				$data[$attribute->nodeName] = $attribute->nodeValue;
			}

			foreach( $node->childNodes as $child )
			{
				$name = $child->nodeName;

				if( $name === 'lists' )
				{
					$item = $this->getProcessor( $name )->process( $item, $child );
					continue;
				}

				// names starting with "#" (e.g. "#text") are no elements and skipped
				if( $name[0] !== '#' ) {
					$data[$name] = $child->nodeValue;
				}
			}

			if( isset( $data['catalog.config'] ) ) {
				$data['catalog.config'] = json_decode( $data['catalog.config'], true );
			} else {
				$data['catalog.config'] = [];
			}

			$item->fromArray( $data, true );
		}
		catch( \Exception $e )
		{
			$trace = $e->getTraceAsString();
			$msg = 'Catalog import error: ' . $e->getMessage() . "\n" . $trace;

			$this->context()->logger()->error( $msg, 'import/xml/catalog' );
		}

		return $item;
	}
456
}
457