Passed
Push — master ( 330c3c...aa616b )
by Aimeos
03:14
created

Standard::import()   B

Complexity

Conditions 6
Paths 23

Size

Total Lines 49
Code Lines 26

Duplication

Lines 0
Ratio 0 %

Importance

Changes 1
Bugs 0 Features 0
Metric Value
cc 6
eloc 26
c 1
b 0
f 0
nc 23
nop 5
dl 0
loc 49
rs 8.8817
1
<?php
2
3
/**
4
 * @license LGPLv3, http://opensource.org/licenses/LGPL-3.0
5
 * @copyright Aimeos (aimeos.org), 2015-2022
6
 * @package Controller
7
 * @subpackage Jobs
8
 */
9
10
11
namespace Aimeos\Controller\Jobs\Product\Import\Csv;
12
13
14
/**
15
 * Job controller for CSV product imports.
16
 *
17
 * @package Controller
18
 * @subpackage Jobs
19
 */
20
class Standard
21
	extends \Aimeos\Controller\Common\Product\Import\Csv\Base
22
	implements \Aimeos\Controller\Jobs\Iface
23
{
24
	/** controller/jobs/product/import/csv/name
25
	 * Class name of the used product import CSV job controller implementation
26
	 *
27
	 * Each default job controller can be replaced by an alternative implementation.
28
	 * To use this implementation, you have to set the last part of the class
29
	 * name as configuration value so the controller factory knows which class it
30
	 * has to instantiate.
31
	 *
32
	 * For example, if the name of the default class is
33
	 *
34
	 *  \Aimeos\Controller\Jobs\Product\Import\Csv\Standard
35
	 *
36
	 * and you want to replace it with your own version named
37
	 *
38
	 *  \Aimeos\Controller\Jobs\Product\Import\Csv\Mycsv
39
	 *
40
	 * then you have to set this configuration option:
41
	 *
42
	 *  controller/jobs/product/import/csv/name = Mycsv
43
	 *
44
	 * The value is the last part of your own class name and it's case sensitive,
45
	 * so take care that the configuration value is exactly named like the last
46
	 * part of the class name.
47
	 *
48
	 * The allowed characters of the class name are A-Z, a-z and 0-9. No other
49
	 * characters are possible! You should always start the last part of the class
50
	 * name with an upper case character and continue only with lower case characters
51
	 * or numbers. Avoid camel case names like "MyCsv"!
52
	 *
53
	 * @param string Last part of the class name
54
	 * @since 2015.01
55
	 */
56
57
	/** controller/jobs/product/import/csv/decorators/excludes
58
	 * Excludes decorators added by the "common" option from the product import CSV job controller
59
	 *
60
	 * Decorators extend the functionality of a class by adding new aspects
61
	 * (e.g. log what is currently done), executing the methods of the underlying
62
	 * class only in certain conditions (e.g. only for logged in users) or
63
	 * modify what is returned to the caller.
64
	 *
65
	 * This option allows you to remove a decorator added via
66
	 * "controller/jobs/common/decorators/default" before they are wrapped
67
	 * around the job controller.
68
	 *
69
	 *  controller/jobs/product/import/csv/decorators/excludes = array( 'decorator1' )
70
	 *
71
	 * This would remove the decorator named "decorator1" from the list of
72
	 * common decorators ("\Aimeos\Controller\Jobs\Common\Decorator\*") added via
73
	 * "controller/jobs/common/decorators/default" to the job controller.
74
	 *
75
	 * @param array List of decorator names
76
	 * @since 2015.01
77
	 * @see controller/jobs/common/decorators/default
78
	 * @see controller/jobs/product/import/csv/decorators/global
79
	 * @see controller/jobs/product/import/csv/decorators/local
80
	 */
81
82
	/** controller/jobs/product/import/csv/decorators/global
83
	 * Adds a list of globally available decorators only to the product import CSV job controller
84
	 *
85
	 * Decorators extend the functionality of a class by adding new aspects
86
	 * (e.g. log what is currently done), executing the methods of the underlying
87
	 * class only in certain conditions (e.g. only for logged in users) or
88
	 * modify what is returned to the caller.
89
	 *
90
	 * This option allows you to wrap global decorators
91
	 * ("\Aimeos\Controller\Jobs\Common\Decorator\*") around the job controller.
92
	 *
93
	 *  controller/jobs/product/import/csv/decorators/global = array( 'decorator1' )
94
	 *
95
	 * This would add the decorator named "decorator1" defined by
96
	 * "\Aimeos\Controller\Jobs\Common\Decorator\Decorator1" only to the job controller.
97
	 *
98
	 * @param array List of decorator names
99
	 * @since 2015.01
100
	 * @see controller/jobs/common/decorators/default
101
	 * @see controller/jobs/product/import/csv/decorators/excludes
102
	 * @see controller/jobs/product/import/csv/decorators/local
103
	 */
104
105
	/** controller/jobs/product/import/csv/decorators/local
106
	 * Adds a list of local decorators only to the product import CSV job controller
107
	 *
108
	 * Decorators extend the functionality of a class by adding new aspects
109
	 * (e.g. log what is currently done), executing the methods of the underlying
110
	 * class only in certain conditions (e.g. only for logged in users) or
111
	 * modify what is returned to the caller.
112
	 *
113
	 * This option allows you to wrap local decorators
114
	 * ("\Aimeos\Controller\Jobs\Product\Import\Csv\Decorator\*") around the job
115
	 * controller.
116
	 *
117
	 *  controller/jobs/product/import/csv/decorators/local = array( 'decorator2' )
118
	 *
119
	 * This would add the decorator named "decorator2" defined by
120
	 * "\Aimeos\Controller\Jobs\Product\Import\Csv\Decorator\Decorator2"
121
	 * only to the job controller.
122
	 *
123
	 * @param array List of decorator names
124
	 * @since 2015.01
125
	 * @see controller/jobs/common/decorators/default
126
	 * @see controller/jobs/product/import/csv/decorators/excludes
127
	 * @see controller/jobs/product/import/csv/decorators/global
128
	 */
129
130
131
	private $types;
132
133
134
	/**
	 * Provides the translated, human readable name of this job.
	 *
	 * @return string Name of the job
	 */
	public function getName() : string
	{
		$context = $this->context();

		return $context->translate( 'controller/jobs', 'Product import CSV' );
	}
143
144
145
	/**
	 * Provides the translated, human readable description of this job.
	 *
	 * @return string Description of the job
	 */
	public function getDescription() : string
	{
		$context = $this->context();

		return $context->translate( 'controller/jobs', 'Imports new and updates existing products from CSV files' );
	}
154
155
156
	/**
	 * Executes the job.
	 *
	 * Scans the configured location in the "fs-import" file system and imports
	 * every entry in sorted order. Sub-directories are skipped if the file system
	 * supports directories. Each file is read in chunks limited by the configured
	 * maximum size after the configured number of leading lines has been skipped.
	 * Afterwards, the file is moved to the backup location if one is configured
	 * or removed otherwise, and mail() is called if some lines couldn't be imported.
	 *
	 * Nothing is done if the configured location isn't a directory.
	 *
	 * @throws \Aimeos\Controller\Jobs\Exception If an error occurs
	 */
	public function run()
	{
		$context = $this->context();
		$logger = $context->logger();

		try
		{
			$location = $this->location();
			$fs = $context->fs( 'fs-import' );

			if( $fs->isDir( $location ) === false ) {
				return;
			}

			$maxcnt = $this->max();
			$skiplines = $this->skip();
			$domains = $this->domains();

			$mappings = $this->mapping();
			$processor = $this->getProcessors( $mappings );
			$codePos = $this->getCodePosition( $mappings['item'] );

			foreach( map( $fs->scan( $location ) )->sort() as $filename )
			{
				$path = $location . '/' . $filename;

				if( $fs instanceof \Aimeos\Base\Filesystem\DirIface && $fs->isDir( $path ) ) {
					continue;
				}

				$logger->info( sprintf( 'Started product import from "%1$s"', $path ), 'import/csv/product' );

				$total = $errors = 0;
				$fh = $fs->reads( $path );

				try
				{
					// Drop the header lines which contain no product data
					for( $i = 0; $i < $skiplines; $i++ ) {
						fgetcsv( $fh );
					}

					while( ( $data = $this->getData( $fh, $maxcnt, $codePos ) ) !== [] )
					{
						$products = $this->getProducts( array_keys( $data ), $domains );
						$errors += $this->import( $products, $data, $mappings['item'], [], $processor );

						$total += count( $data );
						unset( $products, $data );
					}
				}
				finally
				{
					// Release the stream even if reading or importing a chunk throws
					fclose( $fh );
				}

				$str = sprintf( 'Finished product import from "%1$s" (%2$d/%3$d)', $path, $errors, $total );
				$logger->info( $str, 'import/csv/product' );

				// Without a configured backup location, the imported file is deleted
				if( !empty( $backup = $this->backup() ) ) {
					$fs->move( $path, $backup );
				} else {
					$fs->rm( $path );
				}

				if( $errors > 0 ) {
					$this->mail( 'Product CSV import', sprintf( 'Invalid product lines in "%1$s": %2$d/%3$d', $path, $errors, $total ) );
				}
			}

			$processor->finish();
		}
		catch( \Exception $e )
		{
			$logger->error( 'Product import error: ' . $e->getMessage() . "\n" . $e->getTraceAsString(), 'import/csv/product' );
			$this->mail( 'Product CSV import error', $e->getMessage() . "\n" . $e->getTraceAsString() );

			// Keep the original exception attached so callers can inspect the root cause
			throw new \Aimeos\Controller\Jobs\Exception( $e->getMessage(), 0, $e );
		}
	}
235
236
237
	/**
	 * Returns the configured backup location with date/time placeholders replaced
	 *
	 * @return string Location for storing imported files or empty string if none is configured
	 */
	protected function backup() : string
	{
		/** controller/jobs/product/import/csv/backup
		 * Name of the backup for successfully imported files
		 *
		 * After a CSV file was imported successfully, you can move it to another
		 * location, so it won't be imported again and isn't overwritten by the
		 * next file that is stored at the same location in the file system.
		 *
		 * You should use an absolute path to be sure but it can be a relative path
		 * if you absolutely know from where the job will be executed from. The
		 * name of the new backup location can contain placeholders understood
		 * by the PHP DateTime::format() method (with percent signs prefix) to
		 * create dynamic paths, e.g. "backup/%Y-%m-%d" which would create
		 * "backup/2000-01-01". For more information about the date() placeholders,
		 * please have a look into the PHP documentation of the
		 * {@link https://www.php.net/manual/en/datetime.format.php format() method}.
		 *
		 * **Note:** If no backup name is configured, the file will be removed!
		 *
		 * @param string Name of the backup file, optionally with date/time placeholders
		 * @since 2018.04
		 * @see controller/jobs/product/import/csv/domains
		 * @see controller/jobs/product/import/csv/location
		 * @see controller/jobs/product/import/csv/mapping
		 * @see controller/jobs/product/import/csv/max-size
		 * @see controller/jobs/product/import/csv/skip-lines
		 */
		$config = $this->context()->config();
		$name = (string) $config->get( 'controller/jobs/product/import/csv/backup' );

		return \Aimeos\Base\Str::strtime( $name );
	}
273
274
275
	/**
	 * Checks the given product type for validity
	 *
	 * The available product type codes are fetched once (at most 10000 entries)
	 * and cached in the object for all subsequent calls.
	 *
	 * @param string|null $type Product type or null for no type
	 * @return string Given product type if it's available, "default" otherwise
	 */
	protected function checkType( ?string $type = null ) : string
	{
		if( !isset( $this->types ) )
		{
			$this->types = [];

			$manager = \Aimeos\MShop::create( $this->context(), 'product/type' );
			$search = $manager->filter()->slice( 0, 10000 );

			foreach( $manager->search( $search ) as $item ) {
				$this->types[$item->getCode()] = $item->getCode();
			}
		}

		// A null type is looked up as empty string, the same key a null array offset resolves to
		return $this->types[(string) $type] ?? 'default';
	}
297
298
299
	/**
	 * Returns the list of domain names that should be retrieved along with the product items
	 *
	 * @return array List of domain names, "media" and "text" if nothing is configured
	 */
	protected function domains() : array
	{
		/** controller/jobs/product/import/csv/domains
		 * List of item domain names that should be retrieved along with the product items
		 *
		 * For efficient processing, the items associated to the products can be
		 * fetched too, minimizing the number of database queries required. To be
		 * most effective, the list of item domain names should be used in the
		 * mapping configuration too, so the retrieved items will be used during
		 * the import.
		 *
		 * @param array Associative list of MShop item domain names
		 * @since 2018.04
		 * @see controller/jobs/product/import/csv/backup
		 * @see controller/jobs/product/import/csv/location
		 * @see controller/jobs/product/import/csv/mapping
		 * @see controller/jobs/product/import/csv/max-size
		 * @see controller/jobs/product/import/csv/skip-lines
		 */
		$config = $this->context()->config();

		return $config->get( 'controller/jobs/product/import/csv/domains', ['media', 'text'] );
	}
325
326
327
	/**
	 * Looks up the position of the "product.code" column in the product item mapping
	 *
	 * @param array $mapping Mapping of the "item" columns with position as key and code as value
	 * @return int Position of the first "product.code" column
	 * @throws \Aimeos\Controller\Jobs\Exception If no mapping for "product.code" is found
	 */
	protected function getCodePosition( array $mapping ) : int
	{
		// Strict search returns the key of the first matching entry or false if there's none
		$pos = array_search( 'product.code', $mapping, true );

		if( $pos === false ) {
			throw new \Aimeos\Controller\Jobs\Exception( 'No "product.code" column in CSV mapping found' );
		}

		return $pos;
	}
345
346
347
	/**
	 * Fetches the product items for the given codes
	 *
	 * @param array $codes List of product codes
	 * @param array $domains List of domains whose items should be fetched too
	 * @return \Aimeos\Map Associative list of product codes as key and product items as value
	 */
	protected function getProducts( array $codes, array $domains ) : \Aimeos\Map
	{
		$manager = \Aimeos\MShop::create( $this->context(), 'product' );

		// Limit the result size to the number of requested codes
		$filter = $manager->filter();
		$filter = $filter->add( ['product.code' => $codes] );
		$filter = $filter->slice( 0, count( $codes ) );

		$found = $manager->search( $filter, $domains );

		return $found->col( null, 'product.code' );
	}
361
362
363
	/**
	 * Imports the CSV data and creates new products or updates existing ones
	 *
	 * Each product is saved within its own transaction of the index manager. If
	 * importing a product fails, its transaction is rolled back, the error is
	 * logged and the import continues with the next product.
	 *
	 * @param \Aimeos\Map $products List of products items implementing \Aimeos\MShop\Product\Item\Iface
	 * @param array $data Associative list of import data as index/value pairs
	 * @param array $mapping Associative list of positions and domain item keys
	 * @param array $types List of allowed product type codes (not used by this implementation)
	 * @param \Aimeos\Controller\Common\Product\Import\Csv\Processor\Iface $processor Processor object
	 * @return int Number of products that couldn't be imported
	 * @throws \Aimeos\Controller\Jobs\Exception
	 */
	protected function import( \Aimeos\Map $products, array $data, array $mapping, array $types,
		\Aimeos\Controller\Common\Product\Import\Csv\Processor\Iface $processor ) : int
	{
		$errors = 0;
		$context = $this->context();
		$manager = \Aimeos\MShop::create( $context, 'index' );

		foreach( $data as $code => $list )
		{
			$manager->begin();

			try
			{
				$code = trim( $code );
				$product = $products[$code] ?? $manager->create();
				$map = current( $this->getMappedChunk( $list, $mapping ) ); // there can only be one chunk for the base product data

				if( $map )
				{
					$type = $this->checkType( $this->val( $map, 'product.type', $product->getType() ) );

					if( $config = $this->val( $map, 'product.config' ) ) {
						$map['product.config'] = json_decode( $config ) ?: [];
					}

					// First save stores the base product data before the processors are applied
					$product = $product->fromArray( $map, true );
					$product = $manager->save( $product->setType( $type ) );

					$processor->process( $product, $list );

					// Second save stores what the processors changed in the product
					$manager->save( $product );
				}

				$manager->commit();
			}
			catch( \Exception $e )
			{
				$manager->rollback();

				$msg = sprintf( 'Unable to import product with code "%1$s": %2$s', $code, $e->getMessage() );
				$context->logger()->error( $msg, 'import/csv/product' );

				$errors++;
			}
		}

		return $errors;
	}
424
425
426
	/**
	 * Returns the configured path to the directory with the CSV files
	 *
	 * @return string Path to the directory with the CSV files, "product" if nothing is configured
	 */
	protected function location() : string
	{
		/** controller/jobs/product/import/csv/location
		 * File or directory where the content is stored which should be imported
		 *
		 * You need to configure the CSV file or directory with the CSV files that
		 * should be imported. It should be an absolute path to be sure but can be
		 * a relative path if you absolutely know from where the job will be executed
		 * from.
		 *
		 * @param string Relative path to the CSV files
		 * @since 2015.08
		 * @see controller/jobs/product/import/csv/backup
		 * @see controller/jobs/product/import/csv/domains
		 * @see controller/jobs/product/import/csv/mapping
		 * @see controller/jobs/product/import/csv/max-size
		 * @see controller/jobs/product/import/csv/skip-lines
		 */
		$config = $this->context()->config();

		return (string) $config->get( 'controller/jobs/product/import/csv/location', 'product' );
	}
452
453
454
	/**
	 * Returns the configured CSV column mapping or the default mapping if none is configured
	 *
	 * @return array CSV column mapping which always contains an "item" list
	 * @throws \Aimeos\Controller\Jobs\Exception If the "item" mapping is missing or no array
	 */
	protected function mapping() : array
	{
		/** controller/jobs/product/import/csv/mapping
		 * List of mappings between the position in the CSV file and item keys
		 *
		 * The importer has to know which data is at which position in the CSV
		 * file. Therefore, you need to specify a mapping between each position
		 * and the MShop domain item key (e.g. "product.code") it represents.
		 *
		 * You can use all domain item keys which are used in the fromArray()
		 * methods of the item classes.
		 *
		 * These mappings are grouped together by their processor names, which
		 * are responsible for importing the data, e.g. all mappings in "item"
		 * will be processed by the base product importer while the mappings in
		 * "text" will be imported by the text processor.
		 *
		 * @param array Associative list of processor names and lists of key/position pairs
		 * @since 2018.04
		 * @see controller/jobs/product/import/csv/backup
		 * @see controller/jobs/product/import/csv/domains
		 * @see controller/jobs/product/import/csv/location
		 * @see controller/jobs/product/import/csv/max-size
		 * @see controller/jobs/product/import/csv/skip-lines
		 */
		$config = $this->context()->config();
		$map = (array) $config->get( 'controller/jobs/product/import/csv/mapping', $this->getDefaultMapping() );

		// A missing "item" entry is treated like one that isn't an array
		if( is_array( $map['item'] ?? null ) ) {
			return $map;
		}

		$msg = sprintf( 'Required mapping key "%1$s" is missing or contains no array', 'item' );
		throw new \Aimeos\Controller\Jobs\Exception( $msg );
	}
494
495
496
	/**
	 * Returns the configured chunk size for importing CSV rows
	 *
	 * @return int Maximum number of CSV rows to import at once, 1000 if nothing is configured
	 */
	protected function max() : int
	{
		/** controller/jobs/product/import/csv/max-size
		 * Maximum number of CSV rows to import at once
		 *
		 * It's more efficient to read and import more than one row at a time
		 * to speed up the import. Usually, the bigger the chunk that is imported
		 * at once, the less time the importer will need. The downside is that
		 * the amount of memory required by the import process will increase as
		 * well. Therefore, it's a trade-off between memory consumption and
		 * import speed.
		 *
		 * @param integer Number of rows
		 * @since 2018.04
		 * @see controller/jobs/product/import/csv/backup
		 * @see controller/jobs/product/import/csv/domains
		 * @see controller/jobs/product/import/csv/location
		 * @see controller/jobs/product/import/csv/mapping
		 * @see controller/jobs/product/import/csv/skip-lines
		 */
		$config = $this->context()->config();

		return (int) $config->get( 'controller/jobs/product/import/csv/max-size', 1000 );
	}
523
524
525
	/**
	 * Returns the configured number of rows skipped at the beginning of each CSV file
	 *
	 * @return int Number of rows skipped at the beginning of each CSV file, 0 if nothing is configured
	 */
	protected function skip() : int
	{
		/** controller/jobs/product/import/csv/skip-lines
		 * Number of rows skipped at the beginning of each CSV file
		 *
		 * Some CSV files contain header information describing the content of
		 * the column values. This data is for informational purpose only and
		 * can't be imported into the database. Using this option, you can
		 * define the number of lines that should be left out before the import
		 * begins.
		 *
		 * @param integer Number of rows
		 * @since 2015.08
		 * @see controller/jobs/product/import/csv/backup
		 * @see controller/jobs/product/import/csv/domains
		 * @see controller/jobs/product/import/csv/location
		 * @see controller/jobs/product/import/csv/mapping
		 * @see controller/jobs/product/import/csv/max-size
		 */
		$config = $this->context()->config();

		return (int) $config->get( 'controller/jobs/product/import/csv/skip-lines', 0 );
	}
551
}
552