Total Complexity | 47 |
Total Lines | 435 |
Duplicated Lines | 0 % |
Changes | 0 |
Complex classes like GedcomExportService often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to find such a component is to look for fields/methods that share the same prefixes, or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use GedcomExportService, and based on these observations, apply Extract Interface, too.
1 | <?php |
||
73 | class GedcomExportService |
||
74 | { |
||
75 | private const ACCESS_LEVELS = [ |
||
76 | 'gedadmin' => Auth::PRIV_NONE, |
||
77 | 'user' => Auth::PRIV_USER, |
||
78 | 'visitor' => Auth::PRIV_PRIVATE, |
||
79 | 'none' => Auth::PRIV_HIDE, |
||
80 | ]; |
||
81 | |||
82 | private ResponseFactoryInterface $response_factory; |
||
83 | |||
84 | private StreamFactoryInterface $stream_factory; |
||
85 | |||
86 | /** |
||
87 | * @param ResponseFactoryInterface $response_factory |
||
88 | * @param StreamFactoryInterface $stream_factory |
||
89 | */ |
||
90 | public function __construct(ResponseFactoryInterface $response_factory, StreamFactoryInterface $stream_factory) |
||
91 | { |
||
92 | $this->response_factory = $response_factory; |
||
93 | $this->stream_factory = $stream_factory; |
||
94 | } |
||
95 | |||
96 | /** |
||
97 | * @param Tree $tree - Export data from this tree |
||
98 | * @param bool $sort_by_xref - Write GEDCOM records in XREF order |
||
99 | * @param string $encoding - Convert from UTF-8 to other encoding |
||
100 | * @param string $privacy - Filter records by role |
||
101 | * @param string $filename - Name of download file, without an extension |
||
102 | * @param string $format - One of: gedcom, zip, zipmedia, gedzip |
||
103 | * |
||
104 | * @return ResponseInterface |
||
105 | */ |
||
106 | public function downloadResponse( |
||
107 | Tree $tree, |
||
108 | bool $sort_by_xref, |
||
109 | string $encoding, |
||
110 | string $privacy, |
||
111 | string $line_endings, |
||
112 | string $filename, |
||
113 | string $format, |
||
114 | Collection $records = null |
||
115 | ): ResponseInterface { |
||
116 | $access_level = self::ACCESS_LEVELS[$privacy]; |
||
117 | |||
118 | if ($format === 'gedcom') { |
||
119 | $resource = $this->export($tree, $sort_by_xref, $encoding, $access_level, $line_endings, $records); |
||
120 | $stream = $this->stream_factory->createStreamFromResource($resource); |
||
121 | |||
122 | return $this->response_factory->createResponse() |
||
123 | ->withBody($stream) |
||
124 | ->withHeader('content-type', 'text/x-gedcom; charset=' . UTF8::NAME) |
||
125 | ->withHeader('content-disposition', 'attachment; filename="' . addcslashes($filename, '"') . '.ged"'); |
||
126 | } |
||
127 | |||
128 | // Create a new/empty .ZIP file |
||
129 | $temp_zip_file = stream_get_meta_data(tmpfile())['uri']; |
||
130 | $zip_provider = new FilesystemZipArchiveProvider($temp_zip_file, 0755); |
||
131 | $zip_adapter = new ZipArchiveAdapter($zip_provider); |
||
132 | $zip_filesystem = new Filesystem($zip_adapter); |
||
133 | |||
134 | if ($format === 'zipmedia') { |
||
135 | $media_path = $tree->getPreference('MEDIA_DIRECTORY'); |
||
136 | } elseif ($format === 'gedzip') { |
||
137 | $media_path = ''; |
||
138 | } else { |
||
139 | // Don't add media |
||
140 | $media_path = null; |
||
141 | } |
||
142 | |||
143 | $resource = $this->export($tree, $sort_by_xref, $encoding, $access_level, $line_endings, $records, $zip_filesystem, $media_path); |
||
144 | |||
145 | if ($format === 'gedzip') { |
||
146 | $zip_filesystem->writeStream('gedcom.ged', $resource); |
||
147 | $extension = '.gdz'; |
||
148 | } else { |
||
149 | $zip_filesystem->writeStream($filename . '.ged', $resource); |
||
150 | $extension = '.zip'; |
||
151 | } |
||
152 | |||
153 | fclose($resource); |
||
154 | |||
155 | $stream = $this->stream_factory->createStreamFromFile($temp_zip_file); |
||
156 | |||
157 | return $this->response_factory->createResponse() |
||
158 | ->withBody($stream) |
||
159 | ->withHeader('content-type', 'application/zip') |
||
160 | ->withHeader('content-disposition', 'attachment; filename="' . addcslashes($filename, '"') . $extension . '"'); |
||
161 | } |
||
162 | |||
163 | /** |
||
164 | * Write GEDCOM data to a stream. |
||
165 | * |
||
166 | * @param Tree $tree - Export data from this tree |
||
167 | * @param bool $sort_by_xref - Write GEDCOM records in XREF order |
||
168 | * @param string $encoding - Convert from UTF-8 to other encoding |
||
169 | * @param int $access_level - Apply privacy filtering |
||
170 | * @param string $line_endings - CRLF or LF |
||
171 | * @param Collection<int,string>|null $records - Just export these records |
||
172 | * @param FilesystemOperator|null $zip_filesystem - Write media files to this filesystem |
||
173 | * @param string|null $media_path - Location within the zip filesystem |
||
174 | * |
||
175 | * @return resource |
||
176 | */ |
||
177 | public function export( |
||
178 | Tree $tree, |
||
179 | bool $sort_by_xref = false, |
||
180 | string $encoding = UTF8::NAME, |
||
181 | int $access_level = Auth::PRIV_HIDE, |
||
182 | string $line_endings = 'CRLF', |
||
183 | Collection $records = null, |
||
184 | FilesystemOperator $zip_filesystem = null, |
||
185 | string $media_path = null |
||
186 | ) { |
||
187 | $stream = fopen('php://memory', 'wb+'); |
||
188 | |||
189 | if ($stream === false) { |
||
190 | throw new RuntimeException('Failed to create temporary stream'); |
||
191 | } |
||
192 | |||
193 | stream_filter_append($stream, GedcomEncodingFilter::class, STREAM_FILTER_WRITE, ['src_encoding' => UTF8::NAME, 'dst_encoding' => $encoding]); |
||
194 | |||
195 | if ($records instanceof Collection) { |
||
196 | // Export just these records - e.g. from clippings cart. |
||
197 | $data = [ |
||
198 | new Collection([$this->createHeader($tree, $encoding, false)]), |
||
|
|||
199 | $records, |
||
200 | new Collection(['0 TRLR']), |
||
201 | ]; |
||
202 | } elseif ($access_level === Auth::PRIV_HIDE) { |
||
203 | // If we will be applying privacy filters, then we will need the GEDCOM record objects. |
||
204 | $data = [ |
||
205 | new Collection([$this->createHeader($tree, $encoding, true)]), |
||
206 | $this->individualQuery($tree, $sort_by_xref)->cursor(), |
||
207 | $this->familyQuery($tree, $sort_by_xref)->cursor(), |
||
208 | $this->sourceQuery($tree, $sort_by_xref)->cursor(), |
||
209 | $this->otherQuery($tree, $sort_by_xref)->cursor(), |
||
210 | $this->mediaQuery($tree, $sort_by_xref)->cursor(), |
||
211 | new Collection(['0 TRLR']), |
||
212 | ]; |
||
213 | } else { |
||
214 | // Disable the pending changes before creating GEDCOM records. |
||
215 | Registry::cache()->array()->remember(AbstractGedcomRecordFactory::class . $tree->id(), static function (): Collection { |
||
216 | return new Collection(); |
||
217 | }); |
||
218 | |||
219 | $data = [ |
||
220 | new Collection([$this->createHeader($tree, $encoding, true)]), |
||
221 | $this->individualQuery($tree, $sort_by_xref)->get()->map(Registry::individualFactory()->mapper($tree)), |
||
222 | $this->familyQuery($tree, $sort_by_xref)->get()->map(Registry::familyFactory()->mapper($tree)), |
||
223 | $this->sourceQuery($tree, $sort_by_xref)->get()->map(Registry::sourceFactory()->mapper($tree)), |
||
224 | $this->otherQuery($tree, $sort_by_xref)->get()->map(Registry::gedcomRecordFactory()->mapper($tree)), |
||
225 | $this->mediaQuery($tree, $sort_by_xref)->get()->map(Registry::mediaFactory()->mapper($tree)), |
||
226 | new Collection(['0 TRLR']), |
||
227 | ]; |
||
228 | } |
||
229 | |||
230 | $media_filesystem = Registry::filesystem()->media($tree); |
||
231 | |||
232 | foreach ($data as $rows) { |
||
233 | foreach ($rows as $datum) { |
||
234 | if (is_string($datum)) { |
||
235 | $gedcom = $datum; |
||
236 | } elseif ($datum instanceof GedcomRecord) { |
||
237 | $gedcom = $datum->privatizeGedcom($access_level); |
||
238 | } else { |
||
239 | $gedcom = |
||
240 | $datum->i_gedcom ?? |
||
241 | $datum->f_gedcom ?? |
||
242 | $datum->s_gedcom ?? |
||
243 | $datum->m_gedcom ?? |
||
244 | $datum->o_gedcom; |
||
245 | } |
||
246 | |||
247 | if ($media_path !== null && $zip_filesystem !== null && preg_match('/0 @' . Gedcom::REGEX_XREF . '@ OBJE/', $gedcom) === 1) { |
||
248 | preg_match_all('/\n1 FILE (.+)/', $gedcom, $matches, PREG_SET_ORDER); |
||
249 | |||
250 | foreach ($matches as $match) { |
||
251 | $media_file = $match[1]; |
||
252 | |||
253 | if ($media_filesystem->fileExists($media_file)) { |
||
254 | $zip_filesystem->writeStream($media_path . $media_file, $media_filesystem->readStream($media_file)); |
||
255 | } |
||
256 | } |
||
257 | } |
||
258 | |||
259 | $gedcom = $this->wrapLongLines($gedcom, Gedcom::LINE_LENGTH) . "\n"; |
||
260 | |||
261 | if ($line_endings === 'CRLF') { |
||
262 | $gedcom = strtr($gedcom, ["\n" => "\r\n"]); |
||
263 | } |
||
264 | |||
265 | $bytes_written = fwrite($stream, $gedcom); |
||
266 | |||
267 | if ($bytes_written !== strlen($gedcom)) { |
||
268 | throw new RuntimeException('Unable to write to stream. Perhaps the disk is full?'); |
||
269 | } |
||
270 | } |
||
271 | } |
||
272 | |||
273 | if (rewind($stream) === false) { |
||
274 | throw new RuntimeException('Cannot rewind temporary stream'); |
||
275 | } |
||
276 | |||
277 | return $stream; |
||
278 | } |
||
279 | |||
280 | /** |
||
281 | * Create a header record for a gedcom file. |
||
282 | * |
||
283 | * @param Tree $tree |
||
284 | * @param string $encoding |
||
285 | * @param bool $include_sub |
||
286 | * |
||
287 | * @return string |
||
288 | */ |
||
289 | public function createHeader(Tree $tree, string $encoding, bool $include_sub): string |
||
290 | { |
||
291 | // Force a ".ged" suffix |
||
292 | $filename = $tree->name(); |
||
293 | |||
294 | if (strtolower(pathinfo($filename, PATHINFO_EXTENSION)) !== 'ged') { |
||
295 | $filename .= '.ged'; |
||
296 | } |
||
297 | |||
298 | $gedcom_encodings = [ |
||
299 | UTF16BE::NAME => 'UNICODE', |
||
300 | UTF16LE::NAME => 'UNICODE', |
||
301 | Windows1252::NAME => 'ANSI', |
||
302 | ]; |
||
303 | |||
304 | $encoding = $gedcom_encodings[$encoding] ?? $encoding; |
||
305 | |||
306 | // Build a new header record |
||
307 | $gedcom = '0 HEAD'; |
||
308 | $gedcom .= "\n1 SOUR " . Webtrees::NAME; |
||
309 | $gedcom .= "\n2 NAME " . Webtrees::NAME; |
||
310 | $gedcom .= "\n2 VERS " . Webtrees::VERSION; |
||
311 | $gedcom .= "\n1 DEST DISKETTE"; |
||
312 | $gedcom .= "\n1 DATE " . strtoupper(date('d M Y')); |
||
313 | $gedcom .= "\n2 TIME " . date('H:i:s'); |
||
314 | $gedcom .= "\n1 GEDC\n2 VERS 5.5.1\n2 FORM LINEAGE-LINKED"; |
||
315 | $gedcom .= "\n1 CHAR " . $encoding; |
||
316 | $gedcom .= "\n1 FILE " . $filename; |
||
317 | |||
318 | // Preserve some values from the original header |
||
319 | $header = Registry::headerFactory()->make('HEAD', $tree) ?? Registry::headerFactory()->new('HEAD', '0 HEAD', null, $tree); |
||
320 | |||
321 | foreach ($header->facts(['COPR', 'LANG', 'PLAC', 'NOTE']) as $fact) { |
||
322 | $gedcom .= "\n" . $fact->gedcom(); |
||
323 | } |
||
324 | |||
325 | if ($include_sub) { |
||
326 | foreach ($header->facts(['SUBM', 'SUBN']) as $fact) { |
||
327 | $gedcom .= "\n" . $fact->gedcom(); |
||
328 | } |
||
329 | } |
||
330 | |||
331 | return $gedcom; |
||
332 | } |
||
333 | |||
334 | /** |
||
335 | * Prepend a media path, such as might have been removed during import. |
||
336 | * |
||
337 | * @param string $gedcom |
||
338 | * @param string $media_path |
||
339 | * |
||
340 | * @return string |
||
341 | */ |
||
342 | private function convertMediaPath(string $gedcom, string $media_path): string |
||
343 | { |
||
344 | if (preg_match('/^0 @[^@]+@ OBJE/', $gedcom)) { |
||
345 | return preg_replace_callback('/\n1 FILE (.+)/', static function (array $match) use ($media_path): string { |
||
346 | $filename = $match[1]; |
||
347 | |||
348 | // Don’t modify external links |
||
349 | if (!str_contains($filename, '://')) { |
||
350 | $filename = $media_path . $filename; |
||
351 | } |
||
352 | |||
353 | return "\n1 FILE " . $filename; |
||
354 | }, $gedcom); |
||
355 | } |
||
356 | |||
357 | return $gedcom; |
||
358 | } |
||
359 | |||
360 | /** |
||
361 | * Wrap long lines using concatenation records. |
||
362 | * |
||
363 | * @param string $gedcom |
||
364 | * @param int $max_line_length |
||
365 | * |
||
366 | * @return string |
||
367 | */ |
||
368 | public function wrapLongLines(string $gedcom, int $max_line_length): string |
||
369 | { |
||
370 | $lines = []; |
||
371 | |||
372 | foreach (explode("\n", $gedcom) as $line) { |
||
373 | // Split long lines |
||
374 | // The total length of a GEDCOM line, including level number, cross-reference number, |
||
375 | // tag, value, delimiters, and terminator, must not exceed 255 (wide) characters. |
||
376 | if (mb_strlen($line) > $max_line_length) { |
||
377 | [$level, $tag] = explode(' ', $line, 3); |
||
378 | if ($tag !== 'CONT') { |
||
379 | $level++; |
||
380 | } |
||
381 | do { |
||
382 | // Split after $pos chars |
||
383 | $pos = $max_line_length; |
||
384 | // Split on a non-space (standard gedcom behavior) |
||
385 | while (mb_substr($line, $pos - 1, 1) === ' ') { |
||
386 | --$pos; |
||
387 | } |
||
388 | if ($pos === strpos($line, ' ', 3)) { |
||
389 | // No non-spaces in the data! Can’t split it :-( |
||
390 | break; |
||
391 | } |
||
392 | $lines[] = mb_substr($line, 0, $pos); |
||
393 | $line = $level . ' CONC ' . mb_substr($line, $pos); |
||
394 | } while (mb_strlen($line) > $max_line_length); |
||
395 | } |
||
396 | $lines[] = $line; |
||
397 | } |
||
398 | |||
399 | return implode("\n", $lines); |
||
400 | } |
||
401 | |||
402 | /** |
||
403 | * @param Tree $tree |
||
404 | * @param bool $sort_by_xref |
||
405 | * |
||
406 | * @return Builder |
||
407 | */ |
||
408 | private function familyQuery(Tree $tree, bool $sort_by_xref): Builder |
||
422 | } |
||
423 | |||
424 | /** |
||
425 | * @param Tree $tree |
||
426 | * @param bool $sort_by_xref |
||
427 | * |
||
428 | * @return Builder |
||
429 | */ |
||
430 | private function individualQuery(Tree $tree, bool $sort_by_xref): Builder |
||
431 | { |
||
432 | $query = DB::table('individuals') |
||
433 | ->where('i_file', '=', $tree->id()) |
||
434 | ->select(['i_gedcom', 'i_id']); |
||
435 | |||
436 | if ($sort_by_xref) { |
||
437 | $query |
||
438 | ->orderBy(new Expression('LENGTH(i_id)')) |
||
439 | ->orderBy('i_id'); |
||
440 | } |
||
441 | |||
442 | return $query; |
||
443 | } |
||
444 | |||
445 | /** |
||
446 | * @param Tree $tree |
||
447 | * @param bool $sort_by_xref |
||
448 | * |
||
449 | * @return Builder |
||
450 | */ |
||
451 | private function sourceQuery(Tree $tree, bool $sort_by_xref): Builder |
||
452 | { |
||
453 | $query = DB::table('sources') |
||
454 | ->where('s_file', '=', $tree->id()) |
||
455 | ->select(['s_gedcom', 's_id']); |
||
456 | |||
457 | if ($sort_by_xref) { |
||
458 | $query |
||
459 | ->orderBy(new Expression('LENGTH(s_id)')) |
||
460 | ->orderBy('s_id'); |
||
461 | } |
||
462 | |||
463 | return $query; |
||
464 | } |
||
465 | |||
466 | /** |
||
467 | * @param Tree $tree |
||
468 | * @param bool $sort_by_xref |
||
469 | * |
||
470 | * @return Builder |
||
471 | */ |
||
472 | private function mediaQuery(Tree $tree, bool $sort_by_xref): Builder |
||
485 | } |
||
486 | |||
487 | /** |
||
488 | * @param Tree $tree |
||
489 | * @param bool $sort_by_xref |
||
490 | * |
||
491 | * @return Builder |
||
492 | */ |
||
493 | private function otherQuery(Tree $tree, bool $sort_by_xref): Builder |
||
508 | } |
||
509 | } |
||
510 |