Passed
Push — main ( 7be741...28b704 )
by Jonathan
04:17
created

SosaStatisticsService::isPdoSupported()   A

Complexity

Conditions 1
Paths 1

Size

Total Lines 3
Code Lines 1

Duplication

Lines 0
Ratio 0 %

Importance

Changes 1
Bugs 0 Features 0
Metric Value
cc 1
eloc 1
c 1
b 0
f 0
nc 1
nop 0
dl 0
loc 3
rs 10
1
<?php
2
3
/**
4
 * webtrees-lib: MyArtJaub library for webtrees
5
 *
6
 * @package MyArtJaub\Webtrees
7
 * @subpackage Sosa
8
 * @author Jonathan Jaubart <[email protected]>
9
 * @copyright Copyright (c) 2009-2022, Jonathan Jaubart
10
 * @license http://www.gnu.org/licenses/gpl.html GNU General Public License, version 3
11
 */
12
13
declare(strict_types=1);
14
15
namespace MyArtJaub\Webtrees\Module\Sosa\Services;
16
17
use Fisharebest\Webtrees\Individual;
18
use Fisharebest\Webtrees\Registry;
19
use Fisharebest\Webtrees\Tree;
20
use Fisharebest\Webtrees\Contracts\UserInterface;
21
use Illuminate\Database\Capsule\Manager as DB;
22
use Illuminate\Database\Query\Builder;
23
use Illuminate\Database\Query\JoinClause;
24
use Illuminate\Support\Collection;
25
use stdClass;
26
27
/**
28
 * Service for retrieving Sosa statistics
29
 */
30
class SosaStatisticsService
31
{
32
    private UserInterface $user;
33
    private Tree $tree;
34
35
    /**
     * Create the Sosa statistics service for a tree and a user.
     *
     * Both values are stored on the instance and used by the queries of the service
     * to restrict the Sosa records to that tree and that user.
     *
     * @param Tree $tree Tree for which the statistics are computed
     * @param UserInterface $user User for whom the statistics are computed
     */
    public function __construct(Tree $tree, UserInterface $user)
    {
        $this->user = $user;
        $this->tree = $tree;
    }
46
47
    /**
     * Tell whether the current database driver supports the queries used in the Sosa statistics.
     *
     * SQLite is not supported: it does not provide RIGHT and FULL JOIN,
     * and POWER/SQRT require a specific compilation flag.
     *
     * @return bool False when the connection driver is SQLite, true otherwise
     */
    public function isPdoSupported(): bool
    {
        $driver_name = DB::connection()->getDriverName();

        return $driver_name !== 'sqlite';
    }
58
59
    /**
     * Return the Sosa root individual for the reference tree and user.
     *
     * The identifier of the root is read from the user preference MAJ_SOSA_ROOT_ID of the tree,
     * and handed to the individual factory.
     *
     * @return Individual|null
     */
    public function rootIndividual(): ?Individual
    {
        $root_xref = $this->tree->getUserPreference($this->user, 'MAJ_SOSA_ROOT_ID');
        $individual_factory = Registry::individualFactory();

        return $individual_factory->make($root_xref, $this->tree);
    }
69
70
    /**
     * Get the highest Sosa generation recorded for the reference tree and user.
     *
     * The aggregate is cast to an integer, so a null aggregate is returned as 0.
     *
     * @return int
     */
    public function maxGeneration(): int
    {
        $highest_generation = DB::table('maj_sosa')
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->max('majs_gen');

        return (int) $highest_generation;
    }
82
83
    /**
     * Count all the individuals of the reference tree, whether they are Sosa ancestors or not.
     *
     * @return int
     */
    public function totalIndividuals(): int
    {
        $tree_individuals = DB::table('individuals')
            ->where('i_file', '=', $this->tree->id());

        return $tree_individuals->count();
    }
94
95
    /**
     * Count the Sosa ancestors of the reference tree and user, over all generations.
     *
     * Every Sosa record is counted, so an individual holding several Sosa numbers is counted several times.
     *
     * @return int
     */
    public function totalAncestors(): int
    {
        $sosa_records = DB::table('maj_sosa')
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id());

        return $sosa_records->count();
    }
107
108
    /**
     * Count the Sosa ancestors of the reference tree and user for a single generation.
     *
     * @param int $gen Generation to count the Sosa records for
     * @return int
     */
    public function totalAncestorsAtGeneration(int $gen): int
    {
        $generation_records = DB::table('maj_sosa')
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->where('majs_gen', '=', $gen);

        return $generation_records->count();
    }
121
122
    /**
     * Count the distinct individuals among the Sosa ancestors, over all generations.
     *
     * Unlike totalAncestors(), the count is made on distinct values of the individual identifier.
     *
     * @return int
     */
    public function totalDistinctAncestors(): int
    {
        $distinct_records = DB::table('maj_sosa')
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->distinct();

        return $distinct_records->count('majs_i_id');
    }
135
136
    /**
     * Get the mean generation time, as the slope of the linear regression of birth years vs generations.
     *
     * Only the Sosa records with a known birth year are used. The slope is returned with its sign inverted
     * (presumably because birth years decrease when generations increase, giving a positive duration).
     *
     * 0 is returned when the regression cannot be computed, i.e. when:
     *  - no Sosa record has a birth year;
     *  - all the dated Sosa records belong to the same generation (the slope is then undefined).
     *
     * @return float
     */
    public function meanGenerationTime(): float
    {
        $row = DB::table('maj_sosa')
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->whereNotNull('majs_birth_year')
            ->selectRaw('COUNT(majs_sosa) AS n')
            ->selectRaw('SUM(majs_gen * majs_birth_year) AS sum_xy')
            ->selectRaw('SUM(majs_gen) AS sum_x')
            ->selectRaw('SUM(majs_birth_year) AS sum_y')
            ->selectRaw('SUM(majs_gen * majs_gen) AS sum_x2')
            ->get()->first();

        // The sums are NULL when no row matches, so they must not be used in that case.
        if ($row === null || (int) $row->n === 0) {
            return 0.0;
        }

        // Aggregates may be returned as numeric strings by the driver: make the numeric types explicit.
        $n = (int) $row->n;
        $sum_x = (float) $row->sum_x;
        $sum_y = (float) $row->sum_y;
        $sum_xy = (float) $row->sum_xy;
        $sum_x2 = (float) $row->sum_x2;

        // This term is zero when all the generations are identical (e.g. only the root has a birth year):
        // dividing by it would raise a DivisionByZeroError.
        $denominator = $n * $sum_x2 - $sum_x ** 2;
        if ($denominator === 0.0) {
            return 0.0;
        }

        // Opposite of the regression slope (n * sum_xy - sum_x * sum_y) / denominator
        return ($sum_x * $sum_y - $n * $sum_xy) / $denominator;
    }
157
158
    /**
     * Get the statistics array detailed by generation.
     *
     * The array is indexed by generation, and each entry holds:
     *  - sosaCount : the number of Sosa in the generation
     *  - sosaTotalCount : the number of Sosa up to the generation
     *  - diffSosaTotalCount : the number of distinct Sosa up to the generation
     *  - firstBirth : the year of the first birth in the generation
     *  - firstEstimatedBirth : the year of the first estimated birth in the generation
     *  - lastBirth : the year of the last birth in the generation
     *  - lastEstimatedBirth : the year of the last estimated birth in the generation
     *
     * The counts are cast to integers, the years are returned as provided by the database.
     *
     * @return array<int, array<string, int|null>> Statistics array
     */
    public function statisticsByGenerations(): array
    {
        $basic_stats = $this->statisticsByGenerationBasicData();
        $cumulative_stats = $this->statisticsByGenerationCumulativeData();

        $result = [];
        foreach ($basic_stats as $generation => $basic) {
            // Both collections are keyed by generation
            $result[(int) $basic->gen] = [
                'sosaCount'             =>  (int) $basic->total_sosa,
                'sosaTotalCount'        =>  (int) $cumulative_stats[$generation]->total_cumul,
                'diffSosaTotalCount'    =>  (int) $cumulative_stats[$generation]->total_distinct_cumul,
                'firstBirth'            =>  $basic->first_year,
                'firstEstimatedBirth'   =>  $basic->first_est_year,
                'lastBirth'             =>  $basic->last_year,
                'lastEstimatedBirth'    =>  $basic->last_est_year
            ];
        }

        return $result;
    }
192
193
    /**
     * Fetch the per-generation aggregates: number of Sosa, and first/last actual and estimated birth years.
     *
     * The rows are ordered by generation, and the returned collection is keyed by generation.
     *
     * @return Collection<int, \stdClass>
     */
    private function statisticsByGenerationBasicData(): Collection
    {
        $aggregates = [
            'COUNT(majs_sosa) AS total_sosa',
            'MIN(majs_birth_year) AS first_year',
            'MIN(majs_birth_year_est) AS first_est_year',
            'MAX(majs_birth_year) AS last_year',
            'MAX(majs_birth_year_est) AS last_est_year',
        ];

        $query = DB::table('maj_sosa')->select('majs_gen AS gen');
        foreach ($aggregates as $aggregate) {
            $query->selectRaw($aggregate);
        }

        $query
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->groupBy('majs_gen')
            ->orderBy('majs_gen', 'asc');

        return $query->get()->keyBy('gen');
    }
213
214
    /**
     * Fetch the cumulative statistics by generation.
     *
     * Each generation is joined to all the Sosa records of lower or equal generation, in order to compute
     * the total and distinct counts of ancestors up to that generation, and a simple pedigree collapse ratio.
     * The returned collection is keyed by generation.
     *
     * @return Collection<int, \stdClass>
     */
    private function statisticsByGenerationCumulativeData(): Collection
    {
        $tree_id = $this->tree->id();
        $user_id = $this->user->id();

        // List of the generations existing for the tree and user
        $generations = DB::table('maj_sosa')
            ->select('majs_gen')
            ->distinct()
            ->where('majs_gedcom_id', '=', $tree_id)
            ->where('majs_user_id', '=', $user_id);

        $cumulative_rows = DB::table('maj_sosa')
            ->joinSub($generations, 'list_gen', function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('maj_sosa.majs_gen', '<=', 'list_gen.majs_gen')
                    ->where('majs_gedcom_id', '=', $tree_id)
                    ->where('majs_user_id', '=', $user_id);
            })
            ->groupBy('list_gen.majs_gen')
            ->select('list_gen.majs_gen AS gen')
            ->selectRaw('COUNT(majs_i_id) AS total_cumul')
            ->selectRaw('COUNT(DISTINCT majs_i_id) AS total_distinct_cumul')
            ->selectRaw('1 - COUNT(DISTINCT majs_i_id) / COUNT(majs_i_id) AS pedi_collapse_simple')
            ->get();

        return $cumulative_rows->keyBy('gen');
    }
238
239
    /**
     * Compute the improved pedigree collapse indicators for each generation.
     *
     * An empty array is returned when the database driver is not supported.
     *
     * Format:
     *  - key : generation
     *  - values:
     *      - pedi_collapse_roots : pedigree collapse of ancestor roots for the generation
     *      - pedi_collapse_xgen : pedigree cross-generation shrinkage for the generation
     *
     * @return array<int, array<string, float>>
     */
    public function pedigreeCollapseByGenerationData(): array
    {
        if (!$this->isPdoSupported()) {
            return [];
        }

        $prefix = DB::connection()->getTablePrefix();
        $tree_id = $this->tree->id();
        $user_id = $this->user->id();

        // List of the generations existing for the tree and user
        $generations = DB::table('maj_sosa')
            ->select('majs_gen')
            ->distinct()
            ->where('majs_gedcom_id', '=', $tree_id)
            ->where('majs_user_id', '=', $user_id);

        // SQL weight of a missing parent, and the CASE expression applying it to the father or mother alias.
        // The fragments are assembled to produce exactly the same SQL text for both parents.
        $missing_parent_weight =
            'POWER(2, ' . $prefix . 'list_gen.majs_gen - ' . $prefix . 'sosa.majs_gen - 1)';
        $missing_parent_case = static fn (string $alias): string =>
            '(CASE  WHEN ' . $prefix . $alias . '.majs_i_id IS NULL' .
            ' THEN ' . $missing_parent_weight . ' ELSE 0  END)';

        /* Compute the contributions of nodes of previous generations to the current generation */
        $roots_contributions = DB::table('maj_sosa AS sosa')
            ->select(['list_gen.majs_gen AS gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id'])
            ->addSelect(['sosa.majs_i_id', 'sosa.majs_gen'])
            ->selectRaw($missing_parent_case('sosa_fat') . ' + ' . $missing_parent_case('sosa_mot') . ' contrib')
            ->joinSub($generations, 'list_gen', function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('sosa.majs_gen', '<', 'list_gen.majs_gen')
                    ->where('majs_gedcom_id', '=', $tree_id)
                    ->where('majs_user_id', '=', $user_id);
            })
            ->leftJoin('maj_sosa AS sosa_fat', function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // Link to sosa's father
                $join->whereRaw($prefix . 'sosa_fat.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa')
                    ->where('sosa_fat.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_fat.majs_user_id', '=', $user_id);
            })
            ->leftJoin('maj_sosa AS sosa_mot', function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // Link to sosa's mother
                $join->whereRaw($prefix . 'sosa_mot.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa + 1')
                    ->where('sosa_mot.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_mot.majs_user_id', '=', $user_id);
            })
            ->where('sosa.majs_gedcom_id', '=', $tree_id)
            ->where('sosa.majs_user_id', '=', $user_id)
            ->where(function (Builder $query): void {
                // Keep only the nodes with at least one missing parent
                $query->whereNull('sosa_fat.majs_i_id')
                    ->orWhereNull('sosa_mot.majs_i_id');
            });

        /* Identify nodes in the generations with ancestors who are also in the same generation.
         * This is the vertical/generational collapse that will reduce the number of roots.
         */
        $non_roots_ancestors = DB::table('maj_sosa AS sosa')
            ->select(['sosa.majs_gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id', 'sosa.majs_sosa'])
            ->selectRaw(
                'MAX(' . $prefix . 'sosa_anc.majs_sosa) - MIN(' . $prefix . 'sosa_anc.majs_sosa) AS full_ancestors'
            )
            ->join('maj_sosa AS sosa_anc', function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // An ancestor of a node is a Sosa of higher generation whose number, divided by
                // 2 to the power of the generation difference, gives the Sosa number of the node.
                $ancestor_condition =
                    'FLOOR(' . $prefix . 'sosa_anc.majs_sosa / POWER(2, ' .
                    $prefix . 'sosa_anc.majs_gen - ' . $prefix . 'sosa.majs_gen)) = ' .
                    $prefix . 'sosa.majs_sosa';

                $join->on('sosa.majs_gen', '<', 'sosa_anc.majs_gen')
                    ->whereRaw($ancestor_condition)
                    ->where('sosa_anc.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_anc.majs_user_id', '=', $user_id);
            })
            ->where('sosa.majs_gedcom_id', '=', $tree_id)
            ->where('sosa.majs_user_id', '=', $user_id)
            ->whereIn('sosa_anc.majs_i_id', function (Builder $query) use ($prefix, $tree_id, $user_id): void {
                // Individuals present in the same generation as the node
                $query->from('maj_sosa AS sosa_gen')
                    ->select('sosa_gen.majs_i_id')
                    ->distinct()
                    ->where('sosa_gen.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_gen.majs_user_id', '=', $user_id)
                    ->whereRaw($prefix . 'sosa_gen.majs_gen = ' . $prefix . 'sosa.majs_gen');
            })
            ->groupBy([
                'sosa.majs_gen',
                'sosa.majs_gedcom_id',
                'sosa.majs_user_id',
                'sosa.majs_sosa',
                'sosa.majs_i_id'
            ]);

        /* Compute the contribution of the nodes in the generation,
         * excluding the nodes with ancestors in the same generation.
         * Nodes with a parent missing are not excluded to cater for the missing one.
         */
        $known_contributions = DB::table('maj_sosa AS sosa')
            ->select(['sosa.majs_gen AS gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id'])
            ->addSelect(['sosa.majs_i_id', 'sosa.majs_gen'])
            ->selectRaw('1 AS contrib')
            ->leftJoinSub(
                $non_roots_ancestors,
                'nonroot',
                function (JoinClause $join) use ($tree_id, $user_id): void {
                    $join->on('sosa.majs_gen', '=', 'nonroot.majs_gen')
                        ->on('sosa.majs_sosa', '=', 'nonroot.majs_sosa')
                        ->where('nonroot.full_ancestors', '>', 0)
                        ->where('nonroot.majs_gedcom_id', '=', $tree_id)
                        ->where('nonroot.majs_user_id', '=', $user_id);
                }
            )
            ->where('sosa.majs_gedcom_id', '=', $tree_id)
            ->where('sosa.majs_user_id', '=', $user_id)
            ->whereNull('nonroot.majs_sosa');

        /* Aggregate both queries, and calculate the sum of contributions by generation roots.
         * Exclude as well nodes that already appear in lower generations, as their branch has already been reduced.
         */
        $all_contributions = $roots_contributions->unionAll($known_contributions);
        $contributions_sum = DB::connection()->query()
            ->fromSub($all_contributions, 'sosa_contribs')
            ->select(['sosa_contribs.gen', 'sosa_contribs.majs_gedcom_id', 'sosa_contribs.majs_user_id'])
            ->addSelect(['sosa_contribs.majs_i_id', 'sosa_contribs.contrib'])
            ->selectRaw(
                'COUNT(' . $prefix . 'sosa_contribs.majs_i_id) * ' . $prefix . 'sosa_contribs.contrib AS totalContrib'
            )
            ->leftJoin('maj_sosa AS sosa_low', function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('sosa_low.majs_gen', '<', 'sosa_contribs.majs_gen')
                    ->on('sosa_low.majs_i_id', '=', 'sosa_contribs.majs_i_id')
                    ->where('sosa_low.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_low.majs_user_id', '=', $user_id);
            })
            ->whereNull('sosa_low.majs_sosa')
            ->groupBy([
                'sosa_contribs.gen',
                'sosa_contribs.majs_gedcom_id',
                'sosa_contribs.majs_user_id',
                'sosa_contribs.majs_i_id',
                'sosa_contribs.contrib'
            ]);

        // Aggregate all generation roots to compute root and generation pedigree collapse
        $collapse_rows = DB::connection()->query()
            ->fromSub($contributions_sum, 'sosa_contribs_sum')
            ->select(['gen'])
            ->selectRaw('SUM(contrib), SUM(totalContrib)')
            ->selectRaw('1 - SUM(contrib) / SUM(totalContrib) AS pedi_collapse_roots')  // Roots/horizontal collapse
            ->selectRaw('1 - SUM(totalContrib) / POWER ( 2, gen - 1) AS pedi_collapse_xgen') // Crossgeneration collapse
            ->groupBy(['gen', 'majs_gedcom_id', 'majs_user_id'])
            ->orderBy('gen')
            ->get();

        $collapse_by_generation = [];
        foreach ($collapse_rows as $collapse_row) {
            $collapse_by_generation[(int) $collapse_row->gen] = [
                'pedi_collapse_roots'   =>  (float) $collapse_row->pedi_collapse_roots,
                'pedi_collapse_xgen'   =>  (float) $collapse_row->pedi_collapse_xgen
            ];
        }

        return $collapse_by_generation;
    }
385
386
    /**
     * Return a Collection of the mean generation depth and deviation for all Sosa ancestors at a given generation.
     * Sosa 1 is of generation 1.
     *
     * Mean generation depth and deviation are calculated based on the works of Marie-Hélène Cazes and Pierre Cazes,
     * published in Population (French Edition), Vol. 51, No. 1 (Jan. - Feb., 1996), pp. 117-140
     * http://kintip.net/index.php?option=com_jdownloads&task=download.send&id=9&catid=4&m=0
     *
     * An empty collection is returned when the database driver is not supported.
     *
     * Format:
     *  - key : sosa number of the ancestor
     *  - values:
     *      - root_ancestor_sosa : Sosa number of the ancestor (same as key)
     *      - root_ancestor_id : ID of the ancestor
     *      - mean_gen_depth : Mean generation depth
     *      - stddev_gen_depth : Standard deviation of generation depth
     *
     * @param int $gen Sosa generation
     * @return Collection<int, \stdClass>
     */
    public function generationDepthStatsAtGeneration(int $gen): Collection
    {
        if (!$this->isPdoSupported()) {
            return collect();
        }

        $table_prefix = DB::connection()->getTablePrefix();
        $tree_id = $this->tree->id();
        $user_id = $this->user->id();

        // Sosa number, at generation $gen, of the ancestor from whom the current Sosa descends.
        // POWER is used throughout (rather than the POW alias) for consistency with the other queries.
        $root_ancestor_sql =
            'FLOOR(((' . $table_prefix . 'sosa.majs_sosa / POWER(2, ' . $table_prefix . 'sosa.majs_gen -1 )) - 1)' .
            ' * POWER(2, ? - 1)) + POWER(2, ? - 1) AS root_ancestor';

        // SQL condition matching the nodes for which neither the father nor the mother is known
        $both_parents_missing_sql =
            $table_prefix . 'sosa_fat.majs_i_id IS NULL AND ' . $table_prefix . 'sosa_mot.majs_i_id IS NULL';

        // Count, by generation and root ancestor, the nodes missing both parents (full) or one parent (semi)
        $missing_ancestors_by_gen = DB::table('maj_sosa AS sosa')
            ->selectRaw($table_prefix . 'sosa.majs_gen - ? AS majs_gen_norm', [$gen])
            ->selectRaw($root_ancestor_sql, [$gen, $gen])
            ->selectRaw('SUM(CASE WHEN ' . $both_parents_missing_sql . ' THEN 1 ELSE 0 END) AS full_root_count')
            ->selectRaw('SUM(CASE WHEN ' . $both_parents_missing_sql . ' THEN 0 ELSE 1 END) As semi_root_count')
            ->leftJoin(
                'maj_sosa AS sosa_fat',
                function (JoinClause $join) use ($table_prefix, $tree_id, $user_id): void {
                    // Link to sosa's father
                    $join->whereRaw($table_prefix . 'sosa_fat.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa')
                        ->where('sosa_fat.majs_gedcom_id', '=', $tree_id)
                        ->where('sosa_fat.majs_user_id', '=', $user_id);
                }
            )
            ->leftJoin(
                'maj_sosa AS sosa_mot',
                function (JoinClause $join) use ($table_prefix, $tree_id, $user_id): void {
                    // Link to sosa's mother
                    $join->whereRaw($table_prefix . 'sosa_mot.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa + 1')
                        ->where('sosa_mot.majs_gedcom_id', '=', $tree_id)
                        ->where('sosa_mot.majs_user_id', '=', $user_id);
                }
            )
            ->where('sosa.majs_gedcom_id', '=', $tree_id)
            ->where('sosa.majs_user_id', '=', $user_id)
            ->where('sosa.majs_gen', '>=', $gen)
            ->where(function (Builder $query): void {
                // Keep only the nodes with at least one missing parent
                $query->whereNull('sosa_fat.majs_i_id')
                    ->orWhereNull('sosa_mot.majs_i_id');
            })
            ->groupBy(['sosa.majs_gen', 'root_ancestor']);

        // Weight applied to each normalised generation in the mean and deviation formulas
        $weight_sql = '( 2 * full_root_count + semi_root_count) /  (2 * POWER(2, majs_gen_norm))';

        return DB::table('maj_sosa AS sosa_list')
            ->select(['stats_by_gen.root_ancestor AS root_ancestor_sosa', 'sosa_list.majs_i_id as root_ancestor_id'])
            ->selectRaw('1 + SUM( (majs_gen_norm) * ' . $weight_sql . ') AS mean_gen_depth')
            ->selectRaw(' SQRT(' .
                '   SUM(POWER(majs_gen_norm, 2) * ' . $weight_sql . ')' .
                '   - POWER( SUM( (majs_gen_norm) * ' . $weight_sql . '), 2)' .
                ' ) AS stddev_gen_depth')
            ->joinSub(
                $missing_ancestors_by_gen,
                'stats_by_gen',
                function (JoinClause $join) use ($tree_id, $user_id): void {
                    $join->on('sosa_list.majs_sosa', '=', 'stats_by_gen.root_ancestor')
                        ->where('sosa_list.majs_gedcom_id', '=', $tree_id)
                        ->where('sosa_list.majs_user_id', '=', $user_id);
                }
            )
            ->groupBy(['stats_by_gen.root_ancestor', 'sosa_list.majs_i_id'])
            ->orderBy('stats_by_gen.root_ancestor')
            ->get()->keyBy('root_ancestor_sosa');
    }
453
454
    /**
     * Return a collection of the most duplicated root Sosa ancestors.
     *
     * Root ancestors are the Sosa with neither father nor mother recorded, and only those appearing
     * more than once are considered. They are sorted by decreasing number of occurrences,
     * then by increasing lowest Sosa number.
     *
     * The number of ancestors to return is limited by the parameter $limit.
     * If several individuals are tied when reaching the limit, none of them are returned,
     * which means that there can be less individuals returned than requested.
     *
     * Format:
     *  - value:
     *      - sosa_i_id : sosa individual
     *      - sosa_count: number of duplications of the ancestor (e.g. 3 if it appears 3 times)
     *
     * @param int $limit Maximum number of ancestors to return
     * @return Collection<\stdClass>
     */
    public function topMultipleAncestorsWithNoTies(int $limit): Collection
    {
        $table_prefix = DB::connection()->getTablePrefix();
        $tree_id = $this->tree->id();
        $user_id = $this->user->id();

        // SQL expression for the number of Sosa numbers held by an individual
        $sosa_count_sql = 'COUNT(' . $table_prefix . 'sosa.majs_sosa)';

        $candidates = DB::table('maj_sosa AS sosa')
            ->select('sosa.majs_i_id AS sosa_i_id')
            ->selectRaw($sosa_count_sql . ' AS sosa_count')
            ->leftJoin(
                'maj_sosa AS sosa_fat',
                function (JoinClause $join) use ($table_prefix, $tree_id, $user_id): void {
                    // Link to sosa's father
                    $join->whereRaw($table_prefix . 'sosa_fat.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa')
                        ->where('sosa_fat.majs_gedcom_id', '=', $tree_id)
                        ->where('sosa_fat.majs_user_id', '=', $user_id);
                }
            )
            ->leftJoin(
                'maj_sosa AS sosa_mot',
                function (JoinClause $join) use ($table_prefix, $tree_id, $user_id): void {
                    // Link to sosa's mother
                    $join->whereRaw($table_prefix . 'sosa_mot.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa + 1')
                        ->where('sosa_mot.majs_gedcom_id', '=', $tree_id)
                        ->where('sosa_mot.majs_user_id', '=', $user_id);
                }
            )
            ->where('sosa.majs_gedcom_id', '=', $tree_id)
            ->where('sosa.majs_user_id', '=', $user_id)
            ->whereNull('sosa_fat.majs_sosa')   // We keep only root individuals, i.e. those with no father or mother
            ->whereNull('sosa_mot.majs_sosa')
            ->groupBy('sosa.majs_i_id')
            ->havingRaw($sosa_count_sql . ' > 1')    // Limit to the duplicate sosas.
            ->orderByRaw($sosa_count_sql . ' DESC, MIN(' . $table_prefix . 'sosa.majs_sosa) ASC')
            ->limit($limit + 1)     // We want to select one more than required, for ties
            ->get();

        // No extra row was fetched: the limit has not been exceeded, so there is no tie to resolve.
        if ($candidates->count() <= $limit) {
            return $candidates;
        }

        // The extra row gives the count at which the limit is crossed: drop every row sharing that count.
        $tied_count = $candidates->last()->sosa_count;

        return $candidates->reject(
            fn (stdClass $candidate): bool => $candidate->sosa_count ===  $tied_count
        );
    }
504
505
    /**
     * Return a computed array of statistics about the dispersion of ancestors across the ancestors
     * at a specified generation.
     *
     * An empty collection is returned when the database driver is not supported.
     *
     * Format:
     *  - key : rank of the ancestor in generation G for which exclusive ancestors have been found
     *          For instance 3 represent the maternal grand father
     *          0 is used for shared ancestors
     *  - values:
     *      - branches: same as key
     *      - majs_i_id: xref of the ancestor at rank key in generation G, or null for shared ancestors
     *      - count_indi: number of ancestors exclusively in the ancestors of the ancestor at rank key
     *
     * For instance a result at generation 3 could be :
     * [
     *  0 => { branches: 0, majs_i_id: null, count_indi: 12 } -> 12 ancestors are shared by the grand-parents
     *  1 => { branches: 1, majs_i_id: X2, count_indi: 32 } -> 32 ancestors are exclusive to the paternal grand-father
     *  2 => { branches: 2, majs_i_id: X3, count_indi: 25 } -> 25 ancestors are exclusive to the paternal grand-mother
     *  3 => { branches: 3, majs_i_id: X4, count_indi: 12 } -> 12 ancestors are exclusive to the maternal grand-father
     *  4 => { branches: 4, majs_i_id: X5, count_indi: 30 } -> 30 ancestors are exclusive to the maternal grand-mother
     * ]
     *
     * @param int $gen Generation of the ancestors used as heads of the branches
     * @return Collection<int, \stdClass>
     */
    public function ancestorsDispersionForGeneration(int $gen): Collection
    {
        if (!$this->isPdoSupported()) {
            return collect();
        }

        // For each individual of generation $gen or above, list the branches (rank of the ancestor
        // at generation $gen, starting at 1) in which the individual appears.
        // POWER is used (rather than the POW alias) for consistency with the other queries of the service.
        $ancestors_branches = DB::table('maj_sosa')
            ->select('majs_i_id AS i_id')
            ->selectRaw('FLOOR(majs_sosa / POWER(2, (majs_gen - ?))) - POWER(2, ? -1) + 1 AS branch', [$gen, $gen])
            ->where('majs_gedcom_id', '=', $this->tree->id())
            ->where('majs_user_id', '=', $this->user->id())
            ->where('majs_gen', '>=', $gen)
            ->groupBy('majs_i_id', 'branch');

        // Reduce to one row per individual: its only branch, or 0 when it appears in several branches
        $consolidated_ancestors_branches = DB::table('maj_sosa')
            ->fromSub($ancestors_branches, 'indi_branch')
            ->select('i_id')
            ->selectRaw('CASE WHEN COUNT(branch) > 1 THEN 0 ELSE MIN(branch) END AS branches')
            ->groupBy('i_id');

        // Count the individuals by branch. The right join retrieves the Sosa heading each branch,
        // and keeps the shared individuals (branch 0), for which no Sosa record is matched.
        return DB::table('maj_sosa')
            ->rightJoinSub(
                $consolidated_ancestors_branches,
                'indi_branch_consolidated',
                function (JoinClause $join) use ($gen): void {
                    $join->where('maj_sosa.majs_gedcom_id', '=', $this->tree->id())
                        ->where('maj_sosa.majs_user_id', '=', $this->user->id())
                        ->where('branches', '>', 0)
                        ->whereRaw('majs_sosa = POWER(2, ? - 1) + branches - 1', [$gen]);
                }
            )
            ->select(['branches', 'majs_i_id'])
            ->selectRaw('COUNT(i_id) AS count_indi')
            ->groupBy(['branches', 'majs_i_id'])
            ->get()->keyBy('branches');
    }
566
}
567