| Total Complexity | 46 |
| Total Lines | 362 |
| Duplicated Lines | 0 % |
| Changes | 2 | ||
| Bugs | 0 | Features | 0 |
Complex classes like GedcomExportService often do a lot of different things. To break such a class down, we need to identify a cohesive component within that class. A common approach to finding such a component is to look for fields/methods that share the same prefixes or suffixes.
Once you have determined the fields that belong together, you can apply the Extract Class refactoring. If the component makes sense as a sub-class, Extract Subclass is also a candidate, and is often faster.
While breaking up the class, it is a good idea to analyze how other classes use GedcomExportService, and based on these observations, apply Extract Interface, too.
| 1 | <?php |
||
| 73 | class GedcomExportService |
||
| 74 | { |
||
/**
 * Maps the privacy option chosen for an export to the access level
 * that is used when privatizing the exported records.
 */
private const ACCESS_LEVELS = [
    'gedadmin' => Auth::PRIV_NONE,
    'user'     => Auth::PRIV_USER,
    'visitor'  => Auth::PRIV_PRIVATE,
    'none'     => Auth::PRIV_HIDE,
];

/**
 * @param ResponseFactoryInterface $response_factory Creates the download responses
 * @param StreamFactoryInterface   $stream_factory   Wraps exported data as a response body
 */
public function __construct(
    private ResponseFactoryInterface $response_factory,
    private StreamFactoryInterface $stream_factory,
) {
}
||
| 91 | |||
/**
 * Create a download response containing a GEDCOM export of a tree.
 *
 * For the "gedcom" format, the response body is the GEDCOM data itself.
 * For every other format, the GEDCOM data is written to a temporary .ZIP
 * archive, and the archive becomes the response body.
 *
 * @param Tree                                            $tree         Export data from this tree
 * @param bool                                            $sort_by_xref Write GEDCOM records in XREF order
 * @param string                                          $encoding     Convert from UTF-8 to other encoding
 * @param string                                          $privacy      Filter records by role
 * @param string                                          $line_endings CRLF or LF
 * @param string                                          $filename     Name of download file, without an extension
 * @param string                                          $format       One of: gedcom, zip, zipmedia, gedzip
 * @param Collection<int,string|object|GedcomRecord>|null $records      Just export these records
 *
 * @return ResponseInterface
 *
 * @throws \InvalidArgumentException If $privacy is not a key of ACCESS_LEVELS
 * @throws RuntimeException          If a temporary file cannot be created
 */
public function downloadResponse(
    Tree $tree,
    bool $sort_by_xref,
    string $encoding,
    string $privacy,
    string $line_endings,
    string $filename,
    string $format,
    Collection|null $records = null
): ResponseInterface {
    // Fail with a clear message, rather than a warning followed by a type error.
    $access_level = self::ACCESS_LEVELS[$privacy]
        ?? throw new \InvalidArgumentException('Unknown privacy option: ' . $privacy);

    if ($format === 'gedcom') {
        $resource = $this->export($tree, $sort_by_xref, $encoding, $access_level, $line_endings, $records);
        $stream   = $this->stream_factory->createStreamFromResource($resource);

        // NOTE(review): the charset is always reported as UTF-8, even when $encoding differs - confirm this is intended.
        return $this->response_factory->createResponse()
            ->withBody($stream)
            ->withHeader('content-type', 'text/x-gedcom; charset=' . UTF8::NAME)
            ->withHeader('content-disposition', 'attachment; filename="' . addcslashes($filename, '"') . '.ged"');
    }

    // Reserve a unique temporary path for a new/empty .ZIP file.
    // Closing the handle removes the placeholder file, so the archive is created from scratch.
    $temp_handle = tmpfile();

    if ($temp_handle === false) {
        throw new RuntimeException('Failed to create temporary file');
    }

    $temp_zip_file = stream_get_meta_data($temp_handle)['uri'];
    fclose($temp_handle);

    $zip_provider   = new FilesystemZipArchiveProvider($temp_zip_file, 0755);
    $zip_adapter    = new ZipArchiveAdapter($zip_provider);
    $zip_filesystem = new Filesystem($zip_adapter);

    // A null media path means "don't add media".
    $media_path = match ($format) {
        'zipmedia' => $tree->getPreference('MEDIA_DIRECTORY'),
        'gedzip'   => '',
        default    => null,
    };

    $resource = $this->export($tree, $sort_by_xref, $encoding, $access_level, $line_endings, $records, $zip_filesystem, $media_path);

    try {
        if ($format === 'gedzip') {
            $zip_filesystem->writeStream('gedcom.ged', $resource);
            $extension = '.gdz';
        } else {
            $zip_filesystem->writeStream($filename . '.ged', $resource);
            $extension = '.zip';
        }
    } finally {
        // Release the export stream, even if it could not be added to the archive.
        fclose($resource);
    }

    $stream = $this->stream_factory->createStreamFromFile($temp_zip_file);

    return $this->response_factory->createResponse()
        ->withBody($stream)
        ->withHeader('content-type', 'application/zip')
        ->withHeader('content-disposition', 'attachment; filename="' . addcslashes($filename, '"') . $extension . '"');
}
||
| 158 | |||
/**
 * Write GEDCOM data to a stream.
 *
 * The data is written to an in-memory stream, through a filter that converts
 * it from UTF-8 to $encoding.  The stream is rewound before it is returned.
 * When both $zip_filesystem and $media_path are provided, the files named in
 * media objects are also copied from the tree's media filesystem to the zip filesystem.
 *
 * @param Tree                                            $tree           Export data from this tree
 * @param bool                                            $sort_by_xref   Write GEDCOM records in XREF order
 * @param string                                          $encoding       Convert from UTF-8 to other encoding
 * @param int                                             $access_level   Apply privacy filtering
 * @param string                                          $line_endings   CRLF or LF
 * @param Collection<int,string|object|GedcomRecord>|null $records        Just export these records
 * @param FilesystemOperator|null                         $zip_filesystem Write media files to this filesystem
 * @param string|null                                     $media_path     Location within the zip filesystem
 *
 * @return resource
 *
 * @throws RuntimeException If the stream cannot be created, written to, or rewound
 */
public function export(
    Tree $tree,
    bool $sort_by_xref = false,
    string $encoding = UTF8::NAME,
    int $access_level = Auth::PRIV_HIDE,
    string $line_endings = 'CRLF',
    Collection|null $records = null,
    FilesystemOperator|null $zip_filesystem = null,
    string|null $media_path = null
) {
    $stream = fopen('php://memory', 'wb+');

    if ($stream === false) {
        throw new RuntimeException('Failed to create temporary stream');
    }

    stream_filter_append($stream, GedcomEncodingFilter::class, STREAM_FILTER_WRITE, ['src_encoding' => UTF8::NAME, 'dst_encoding' => $encoding]);

    if ($records instanceof Collection) {
        // Export just these records - e.g. from clippings cart.
        $data = [
            new Collection([$this->createHeader($tree, $encoding, false)]),
            $records,
            new Collection(['0 TRLR']),
        ];
    } elseif ($access_level === Auth::PRIV_HIDE) {
        // The raw database rows are exported as they are, so we do not need GEDCOM record objects.
        $data = [
            new Collection([$this->createHeader($tree, $encoding, true)]),
            $this->individualQuery($tree, $sort_by_xref)->cursor(),
            $this->familyQuery($tree, $sort_by_xref)->cursor(),
            $this->sourceQuery($tree, $sort_by_xref)->cursor(),
            $this->otherQuery($tree, $sort_by_xref)->cursor(),
            $this->mediaQuery($tree, $sort_by_xref)->cursor(),
            new Collection(['0 TRLR']),
        ];
    } else {
        // We will be applying privacy filters, so we need the GEDCOM record objects.
        // Disable the pending changes before creating GEDCOM records.
        Registry::cache()->array()->remember(AbstractGedcomRecordFactory::class . $tree->id(), static fn (): Collection => new Collection());

        $data = [
            new Collection([$this->createHeader($tree, $encoding, true)]),
            $this->individualQuery($tree, $sort_by_xref)->get()->map(Registry::individualFactory()->mapper($tree)),
            $this->familyQuery($tree, $sort_by_xref)->get()->map(Registry::familyFactory()->mapper($tree)),
            $this->sourceQuery($tree, $sort_by_xref)->get()->map(Registry::sourceFactory()->mapper($tree)),
            $this->otherQuery($tree, $sort_by_xref)->get()->map(Registry::gedcomRecordFactory()->mapper($tree)),
            $this->mediaQuery($tree, $sort_by_xref)->get()->map(Registry::mediaFactory()->mapper($tree)),
            new Collection(['0 TRLR']),
        ];
    }

    $media_filesystem = $tree->mediaFilesystem();

    foreach ($data as $rows) {
        foreach ($rows as $datum) {
            if (is_string($datum)) {
                // Already GEDCOM text - e.g. the header and trailer.
                $gedcom = $datum;
            } elseif ($datum instanceof GedcomRecord) {
                $gedcom = $datum->privatizeGedcom($access_level);

                // Nothing of this record is visible at this access level.
                if ($gedcom === '') {
                    continue;
                }
            } else {
                // A database row.  Each table uses a different column for the GEDCOM text.
                $gedcom =
                    $datum->i_gedcom ??
                    $datum->f_gedcom ??
                    $datum->s_gedcom ??
                    $datum->m_gedcom ??
                    $datum->o_gedcom;
            }

            // Copy the files of media objects into the zip filesystem.
            if ($media_path !== null && $zip_filesystem !== null && preg_match('/0 @' . Gedcom::REGEX_XREF . '@ OBJE/', $gedcom) === 1) {
                preg_match_all('/\n1 FILE (.+)/', $gedcom, $matches, PREG_SET_ORDER);

                foreach ($matches as $match) {
                    $media_file = $match[1];

                    if ($media_filesystem->fileExists($media_file)) {
                        $zip_filesystem->writeStream($media_path . $media_file, $media_filesystem->readStream($media_file));
                    }
                }
            }

            $gedcom = $this->wrapLongLines($gedcom, Gedcom::LINE_LENGTH) . "\n";

            if ($line_endings === 'CRLF') {
                $gedcom = strtr($gedcom, ["\n" => "\r\n"]);
            }

            $bytes_written = fwrite($stream, $gedcom);

            if ($bytes_written !== strlen($gedcom)) {
                throw new RuntimeException('Unable to write to stream. Perhaps the disk is full?');
            }
        }
    }

    // Callers read the stream from the beginning.
    if (rewind($stream) === false) {
        throw new RuntimeException('Cannot rewind temporary stream');
    }

    return $stream;
}
||
| 277 | |||
/**
 * Create the GEDCOM header record for an export of a tree.
 *
 * @param Tree   $tree        The tree being exported
 * @param string $encoding    Character encoding of the export, written to the CHAR tag
 * @param bool   $include_sub Also copy the SUBM and SUBN facts from the tree's own header
 *
 * @return string
 */
public function createHeader(Tree $tree, string $encoding, bool $include_sub): string
{
    // The FILE tag always has a ".ged" suffix.
    $export_name = $tree->name();
    $has_suffix  = strtolower(pathinfo($export_name, PATHINFO_EXTENSION)) === 'ged';

    if (!$has_suffix) {
        $export_name .= '.ged';
    }

    // Some encodings have a different name in the CHAR tag.
    $char = match ($encoding) {
        UTF16BE::NAME, UTF16LE::NAME => 'UNICODE',
        Windows1252::NAME            => 'ANSI',
        default                      => $encoding,
    };

    // The lines of the new header record.
    $lines = [
        '0 HEAD',
        '1 SOUR ' . Webtrees::NAME,
        '2 NAME ' . Webtrees::NAME,
        '2 VERS ' . Webtrees::VERSION,
        '1 DEST DISKETTE',
        '1 DATE ' . strtoupper(date('d M Y')),
        '2 TIME ' . date('H:i:s'),
        "1 GEDC\n2 VERS 5.5.1\n2 FORM LINEAGE-LINKED",
        '1 CHAR ' . $char,
        '1 FILE ' . $export_name,
    ];

    // Carry over some values from the tree's existing header.
    $header = Registry::headerFactory()->make('HEAD', $tree) ?? Registry::headerFactory()->new('HEAD', '0 HEAD', null, $tree);

    // There should always be a header record.
    if ($header instanceof Header) {
        $tag_groups = [['COPR', 'LANG', 'PLAC', 'NOTE']];

        if ($include_sub) {
            $tag_groups[] = ['SUBM', 'SUBN'];
        }

        foreach ($tag_groups as $tags) {
            foreach ($header->facts($tags) as $fact) {
                $lines[] = $fact->gedcom();
            }
        }
    }

    return implode("\n", $lines);
}
||
| 325 | |||
/**
 * Wrap long GEDCOM lines, using CONC records for the overflow.
 *
 * Each line longer than $max_line_length characters is split, and the
 * remainder is carried on following CONC lines.  The split point is moved
 * back over any spaces, so that the first part never ends with a space.
 *
 * @param string $gedcom          One or more GEDCOM lines, separated by "\n"
 * @param int    $max_line_length Maximum number of characters in each line
 *
 * @return string
 */
public function wrapLongLines(string $gedcom, int $max_line_length): string
{
    $lines = [];

    foreach (explode("\n", $gedcom) as $line) {
        // Split long lines
        // The total length of a GEDCOM line, including level number, cross-reference number,
        // tag, value, delimiters, and terminator, must not exceed 255 (wide) characters.
        if (mb_strlen($line) > $max_line_length) {
            [$level, $tag] = explode(' ', $line, 3);

            // A CONC line is one level below the line that it continues.
            // CONT and CONC lines are already at that level, so their overflow stays there.
            if ($tag !== 'CONT' && $tag !== 'CONC') {
                $level++;
            }

            do {
                // Split after $pos chars
                $pos = $max_line_length;

                // Split on a non-space (standard gedcom behavior)
                while (mb_substr($line, $pos - 1, 1) === ' ') {
                    --$pos;
                }

                if ($pos === strpos($line, ' ', 3)) {
                    // There are no non-spaces in the data, so it cannot be split.
                    break;
                }

                $lines[] = mb_substr($line, 0, $pos);
                $line    = $level . ' CONC ' . mb_substr($line, $pos);
            } while (mb_strlen($line) > $max_line_length);
        }

        $lines[] = $line;
    }

    return implode("\n", $lines);
}
||
| 359 | |||
| 360 | private function familyQuery(Tree $tree, bool $sort_by_xref): Builder |
||
| 373 | } |
||
| 374 | |||
/**
 * Build a query for the individual records of a tree.
 *
 * @param Tree $tree         Fetch the records of this tree
 * @param bool $sort_by_xref Order the records by the length of the XREF, then by the XREF
 *
 * @return Builder
 */
private function individualQuery(Tree $tree, bool $sort_by_xref): Builder
{
    $individuals = DB::table('individuals')
        ->where('i_file', '=', $tree->id())
        ->select(['i_gedcom', 'i_id']);

    if (!$sort_by_xref) {
        return $individuals;
    }

    return $individuals
        ->orderBy(new Expression('LENGTH(i_id)'))
        ->orderBy('i_id');
}
||
| 389 | |||
/**
 * Build a query for the source records of a tree.
 *
 * @param Tree $tree         Fetch the records of this tree
 * @param bool $sort_by_xref Order the records by the length of the XREF, then by the XREF
 *
 * @return Builder
 */
private function sourceQuery(Tree $tree, bool $sort_by_xref): Builder
{
    $sources = DB::table('sources')
        ->where('s_file', '=', $tree->id())
        ->select(['s_gedcom', 's_id']);

    if (!$sort_by_xref) {
        return $sources;
    }

    return $sources
        ->orderBy(new Expression('LENGTH(s_id)'))
        ->orderBy('s_id');
}
||
| 404 | |||
| 405 | private function mediaQuery(Tree $tree, bool $sort_by_xref): Builder |
||
| 418 | } |
||
| 419 | |||
| 420 | private function otherQuery(Tree $tree, bool $sort_by_xref): Builder |
||
| 435 | } |
||
| 436 | } |
||
| 437 |