1
|
|
|
<?php |
2
|
|
|
|
3
|
|
|
/** |
4
|
|
|
* webtrees-lib: MyArtJaub library for webtrees |
5
|
|
|
* |
6
|
|
|
* @package MyArtJaub\Webtrees |
7
|
|
|
* @subpackage Sosa |
8
|
|
|
* @author Jonathan Jaubart <[email protected]> |
9
|
|
|
* @copyright Copyright (c) 2009-2022, Jonathan Jaubart |
10
|
|
|
* @license http://www.gnu.org/licenses/gpl.html GNU General Public License, version 3 |
11
|
|
|
*/ |
12
|
|
|
|
13
|
|
|
declare(strict_types=1); |
14
|
|
|
|
15
|
|
|
namespace MyArtJaub\Webtrees\Module\Sosa\Services; |
16
|
|
|
|
17
|
|
|
use Fisharebest\Webtrees\Individual; |
18
|
|
|
use Fisharebest\Webtrees\Registry; |
19
|
|
|
use Fisharebest\Webtrees\Tree; |
20
|
|
|
use Fisharebest\Webtrees\Contracts\UserInterface; |
21
|
|
|
use Illuminate\Database\Capsule\Manager as DB; |
22
|
|
|
use Illuminate\Database\Query\Builder; |
23
|
|
|
use Illuminate\Database\Query\JoinClause; |
24
|
|
|
use Illuminate\Support\Collection; |
25
|
|
|
use stdClass; |
26
|
|
|
|
27
|
|
|
/** |
28
|
|
|
* Service for retrieving Sosa statistics |
29
|
|
|
*/ |
30
|
|
|
class SosaStatisticsService |
31
|
|
|
{ |
32
|
|
|
private UserInterface $user; |
33
|
|
|
private Tree $tree; |
34
|
|
|
|
/**
 * Create the Sosa statistics service.
 *
 * Both arguments are stored on the instance; the queries of this service
 * are filtered on the identifiers of this tree and this user.
 *
 * @param Tree          $tree Reference tree
 * @param UserInterface $user Reference user
 */
public function __construct(Tree $tree, UserInterface $user)
{
    $this->user = $user;
    $this->tree = $tree;
}
46
|
|
|
|
/**
 * Tell whether the current database driver can run the advanced Sosa statistics queries.
 *
 * SQLite is the only driver reported as unsupported: it does not support RIGHT and FULL JOIN,
 * and POWER/SQRT require a specific compilation flag.
 *
 * @return bool False when the connection driver is 'sqlite', true otherwise
 */
public function isPdoSupported(): bool
{
    $driver_name = DB::connection()->getDriverName();

    return $driver_name !== 'sqlite';
}
58
|
|
|
|
/**
 * Return the root individual for the reference tree and user.
 *
 * The individual identifier is read from the user preference 'MAJ_SOSA_ROOT_ID' of the tree,
 * and resolved through the individual factory.
 *
 * @return Individual|null
 */
public function rootIndividual(): ?Individual
{
    return Registry::individualFactory()->make(
        $this->tree->getUserPreference($this->user, 'MAJ_SOSA_ROOT_ID'),
        $this->tree
    );
}
69
|
|
|
|
/**
 * Get the highest generation recorded for the reference tree and user.
 *
 * @return int Maximum of majs_gen over the matching Sosa rows, cast to an integer
 */
public function maxGeneration(): int
{
    $highest_generation = DB::table('maj_sosa')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id())
        ->max('majs_gen');

    return (int) $highest_generation;
}
82
|
|
|
|
/**
 * Count all the individuals of the reference tree.
 *
 * The count is not restricted to Sosa ancestors, nor to the reference user.
 *
 * @return int
 */
public function totalIndividuals(): int
{
    $tree_individuals = DB::table('individuals')
        ->where('i_file', '=', $this->tree->id());

    return $tree_individuals->count();
}
94
|
|
|
|
/**
 * Count the Sosa ancestors of the reference tree and user, all generations included.
 *
 * Every Sosa row is counted, so an individual holding several Sosa numbers is counted several times.
 *
 * @return int
 */
public function totalAncestors(): int
{
    $sosa_rows = DB::table('maj_sosa')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id());

    return $sosa_rows->count();
}
107
|
|
|
|
/**
 * Count the Sosa ancestors of the reference tree and user in a single generation.
 *
 * @param int $gen Generation to count
 * @return int
 */
public function totalAncestorsAtGeneration(int $gen): int
{
    $generation_rows = DB::table('maj_sosa')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id())
        ->where('majs_gen', '=', $gen);

    return $generation_rows->count();
}
121
|
|
|
|
/**
 * Count the distinct individuals among the Sosa ancestors, all generations included.
 *
 * Unlike the plain ancestors count, an individual holding several Sosa numbers is counted once.
 *
 * @return int
 */
public function totalDistinctAncestors(): int
{
    $sosa_rows = DB::table('maj_sosa')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id());

    return $sosa_rows->distinct()->count('majs_i_id');
}
135
|
|
|
|
/**
 * Get the mean generation time, as the slope of the linear regression of birth years vs generations.
 *
 * Only the Sosa rows with a known birth year are used. The least-squares slope of the birth year
 * against the generation is computed from aggregated sums, and returned with its sign inverted.
 *
 * 0.0 is returned when no row is usable, or when the regression is degenerate (zero denominator,
 * which happens for instance when all usable rows belong to the same generation).
 *
 * @return float
 */
public function meanGenerationTime(): float
{
    $row = DB::table('maj_sosa')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id())
        ->whereNotNull('majs_birth_year')
        ->selectRaw('COUNT(majs_sosa) AS n')
        ->selectRaw('SUM(majs_gen * majs_birth_year) AS sum_xy')
        ->selectRaw('SUM(majs_gen) AS sum_x')
        ->selectRaw('SUM(majs_birth_year) AS sum_y')
        ->selectRaw('SUM(majs_gen * majs_gen) AS sum_x2')
        ->get()->first();

    // Without any usable row, the SUM aggregates are not meaningful: there is nothing to compute.
    if ($row === null || (int) $row->n === 0) {
        return 0.0;
    }

    $denom = $row->n * $row->sum_x2 - pow($row->sum_x, 2);

    // The denominator may be an integer or a float depending on how the driver returns the aggregates.
    // It is normalised before the comparison, as a strict comparison with the integer 0 would let
    // a float 0.0 through and trigger a division by zero.
    if ((float) $denom === 0.0) {
        return 0.0;
    }

    return (float) (-($row->n * $row->sum_xy - $row->sum_x * $row->sum_y) / $denom);
}
158
|
|
|
|
/**
 * Get the statistics array detailed by generation.
 *
 * The result is indexed by generation, and each entry holds:
 *  - sosaCount           : the number of Sosa in the generation
 *  - sosaTotalCount      : the number of Sosa up to the generation
 *  - diffSosaTotalCount  : the number of distinct Sosa up to the generation
 *  - firstBirth          : the year of the first birth in the generation
 *  - firstEstimatedBirth : the year of the first estimated birth in the generation
 *  - lastBirth           : the year of the last birth in the generation
 *  - lastEstimatedBirth  : the year of the last estimated birth in the generation
 *
 * The three counts are cast to integers; the four years are passed through as returned by the database.
 *
 * @return array<int, array<string, int|null>> Statistics array
 */
public function statisticsByGenerations(): array
{
    $basic_rows = $this->statisticsByGenerationBasicData();
    $cumulative_rows = $this->statisticsByGenerationCumulativeData();

    $statistics = [];
    foreach ($basic_rows as $gen_key => $basic) {
        // Both collections are keyed by generation
        $cumulative = $cumulative_rows[$gen_key];

        $statistics[(int) $basic->gen] = [
            'sosaCount'             =>  (int) $basic->total_sosa,
            'sosaTotalCount'        =>  (int) $cumulative->total_cumul,
            'diffSosaTotalCount'    =>  (int) $cumulative->total_distinct_cumul,
            'firstBirth'            =>  $basic->first_year,
            'firstEstimatedBirth'   =>  $basic->first_est_year,
            'lastBirth'             =>  $basic->last_year,
            'lastEstimatedBirth'    =>  $basic->last_est_year,
        ];
    }

    return $statistics;
}
193
|
|
|
|
/**
 * Returns the basic statistics data by generation.
 *
 * Each row, keyed by its generation, exposes:
 *  - gen            : the generation
 *  - total_sosa     : the number of Sosa in the generation
 *  - first_year     : the lowest birth year in the generation
 *  - first_est_year : the lowest estimated birth year in the generation
 *  - last_year      : the highest birth year in the generation
 *  - last_est_year  : the highest estimated birth year in the generation
 *
 * @return Collection<int, \stdClass>
 */
private function statisticsByGenerationBasicData(): Collection
{
    $by_generation = DB::table('maj_sosa')
        ->select('majs_gen AS gen')
        ->selectRaw('COUNT(majs_sosa) AS total_sosa')
        ->selectRaw('MIN(majs_birth_year) AS first_year')
        ->selectRaw('MIN(majs_birth_year_est) AS first_est_year')
        ->selectRaw('MAX(majs_birth_year) AS last_year')
        ->selectRaw('MAX(majs_birth_year_est) AS last_est_year')
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id())
        ->groupBy('majs_gen')
        ->orderBy('majs_gen', 'asc');

    return $by_generation->get()->keyBy('gen');
}
214
|
|
|
|
/**
 * Returns the cumulative statistics data by generation.
 *
 * For every generation known for the tree and user, the Sosa rows of that generation
 * and of all lower generations are aggregated. Each row, keyed by its generation, exposes:
 *  - gen                  : the generation
 *  - total_cumul          : the number of Sosa up to the generation
 *  - total_distinct_cumul : the number of distinct individuals up to the generation
 *  - pedi_collapse_simple : 1 - distinct individuals / Sosa, up to the generation
 *
 * @return Collection<int, \stdClass>
 */
private function statisticsByGenerationCumulativeData(): Collection
{
    $tree_id = $this->tree->id();
    $user_id = $this->user->id();

    // Distinct generations existing for the tree and user
    $generations = DB::table('maj_sosa')->select('majs_gen')->distinct()
        ->where('majs_gedcom_id', '=', $tree_id)
        ->where('majs_user_id', '=', $user_id);

    // Attach to each generation all the Sosa rows of the same or a lower generation
    $up_to_generation = static function (JoinClause $join) use ($tree_id, $user_id): void {
        $join->on('maj_sosa.majs_gen', '<=', 'list_gen.majs_gen')
            ->where('majs_gedcom_id', '=', $tree_id)
            ->where('majs_user_id', '=', $user_id);
    };

    $cumulative_rows = DB::table('maj_sosa')
        ->joinSub($generations, 'list_gen', $up_to_generation)
        ->groupBy('list_gen.majs_gen')
        ->select('list_gen.majs_gen AS gen')
        ->selectRaw('COUNT(majs_i_id) AS total_cumul')
        ->selectRaw('COUNT(DISTINCT majs_i_id) AS total_distinct_cumul')
        ->selectRaw('1 - COUNT(DISTINCT majs_i_id) / COUNT(majs_i_id) AS pedi_collapse_simple')
        ->get();

    return $cumulative_rows->keyBy('gen');
}
239
|
|
|
|
/**
 * Returns the pedigree collapse improved calculation by generation.
 *
 * An empty array is returned when the database driver is not supported.
 *
 * Format:
 *  - key : generation
 *  - values:
 *      - pedi_collapse_roots : pedigree collapse of ancestor roots for the generation
 *      - pedi_collapse_xgen : pedigree cross-generation shrinkage for the generation
 *
 * @return array<int, array<string, float>>
 */
public function pedigreeCollapseByGenerationData(): array
{
    if (!$this->isPdoSupported()) {
        return [];
    }

    $prefix = DB::connection()->getTablePrefix();
    $tree_id = $this->tree->id();
    $user_id = $this->user->id();

    // Distinct generations existing for the tree and user
    $generations = DB::table('maj_sosa')->select('majs_gen')->distinct()
        ->where('majs_gedcom_id', '=', $tree_id)
        ->where('majs_user_id', '=', $user_id);

    // Weight given to a missing parent of a node, when seen from a higher generation
    $missing_parent_weight =
        'POWER(2, ' . $prefix . 'list_gen.majs_gen - ' . $prefix . 'sosa.majs_gen - 1)';

    // Link a Sosa to its father (2 x Sosa) and to its mother (2 x Sosa + 1)
    $join_father = static function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
        $join->whereRaw($prefix . 'sosa_fat.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa')
            ->where('sosa_fat.majs_gedcom_id', '=', $tree_id)
            ->where('sosa_fat.majs_user_id', '=', $user_id);
    };
    $join_mother = static function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
        $join->whereRaw($prefix . 'sosa_mot.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa + 1')
            ->where('sosa_mot.majs_gedcom_id', '=', $tree_id)
            ->where('sosa_mot.majs_user_id', '=', $user_id);
    };

    /* Compute the contributions of nodes of previous generations to the current generation.
     * Only the nodes with at least one parent missing are kept.
     */
    $root_contributions = DB::table('maj_sosa AS sosa')
        ->select(['list_gen.majs_gen AS gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id'])
        ->addSelect(['sosa.majs_i_id', 'sosa.majs_gen'])
        ->selectRaw(
            '(CASE ' .
            ' WHEN ' . $prefix . 'sosa_fat.majs_i_id IS NULL' .
            ' THEN ' . $missing_parent_weight .
            ' ELSE 0 ' .
            ' END)' .
            ' + (CASE ' .
            ' WHEN ' . $prefix . 'sosa_mot.majs_i_id IS NULL' .
            ' THEN ' . $missing_parent_weight .
            ' ELSE 0 ' .
            ' END) contrib'
        )
        ->joinSub(
            $generations,
            'list_gen',
            static function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('sosa.majs_gen', '<', 'list_gen.majs_gen')
                    ->where('majs_gedcom_id', '=', $tree_id)
                    ->where('majs_user_id', '=', $user_id);
            }
        )
        ->leftJoin('maj_sosa AS sosa_fat', $join_father)
        ->leftJoin('maj_sosa AS sosa_mot', $join_mother)
        ->where('sosa.majs_gedcom_id', '=', $tree_id)
        ->where('sosa.majs_user_id', '=', $user_id)
        ->where(static function (Builder $query): void {
            $query->whereNull('sosa_fat.majs_i_id')
                ->orWhereNull('sosa_mot.majs_i_id');
        });

    /* Identify nodes in the generations with ancestors who are also in the same generation.
     * This is the vertical/generational collapse that will reduce the number of roots.
     */
    $non_root_ancestors = DB::table('maj_sosa AS sosa')
        ->select(['sosa.majs_gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id', 'sosa.majs_sosa'])
        ->selectRaw('MAX(' . $prefix . 'sosa_anc.majs_sosa) - MIN(' . $prefix . 'sosa_anc.majs_sosa)' .
            ' AS full_ancestors')
        ->join(
            'maj_sosa AS sosa_anc',
            static function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // sosa_anc is an ancestor of sosa when truncating its Sosa number
                // by the generation gap gives back the Sosa number of sosa
                $join->on('sosa.majs_gen', '<', 'sosa_anc.majs_gen')
                    ->whereRaw('FLOOR(' . $prefix . 'sosa_anc.majs_sosa / POWER(2, ' .
                        $prefix . 'sosa_anc.majs_gen - ' . $prefix . 'sosa.majs_gen)) = ' .
                        $prefix . 'sosa.majs_sosa')
                    ->where('sosa_anc.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_anc.majs_user_id', '=', $user_id);
            }
        )
        ->where('sosa.majs_gedcom_id', '=', $tree_id)
        ->where('sosa.majs_user_id', '=', $user_id)
        ->whereIn(
            'sosa_anc.majs_i_id',
            static function (Builder $query) use ($prefix, $tree_id, $user_id): void {
                $query->from('maj_sosa AS sosa_gen')
                    ->select('sosa_gen.majs_i_id')->distinct()
                    ->where('sosa_gen.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_gen.majs_user_id', '=', $user_id)
                    ->whereRaw($prefix . 'sosa_gen.majs_gen = ' . $prefix . 'sosa.majs_gen');
            }
        )
        ->groupBy(['sosa.majs_gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id',
            'sosa.majs_sosa', 'sosa.majs_i_id']);

    /* Compute the contribution of the nodes in the generation,
     * excluding the nodes with ancestors in the same generation.
     * Nodes with a parent missing are not excluded to cater for the missing one.
     */
    $known_contributions = DB::table('maj_sosa AS sosa')
        ->select(['sosa.majs_gen AS gen', 'sosa.majs_gedcom_id', 'sosa.majs_user_id'])
        ->addSelect(['sosa.majs_i_id', 'sosa.majs_gen'])
        ->selectRaw('1 AS contrib')
        ->leftJoinSub(
            $non_root_ancestors,
            'nonroot',
            static function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('sosa.majs_gen', '=', 'nonroot.majs_gen')
                    ->on('sosa.majs_sosa', '=', 'nonroot.majs_sosa')
                    ->where('nonroot.full_ancestors', '>', 0)
                    ->where('nonroot.majs_gedcom_id', '=', $tree_id)
                    ->where('nonroot.majs_user_id', '=', $user_id);
            }
        )
        ->where('sosa.majs_gedcom_id', '=', $tree_id)
        ->where('sosa.majs_user_id', '=', $user_id)
        ->whereNull('nonroot.majs_sosa');

    /* Aggregate both queries, and calculate the sum of contributions by generation roots.
     * Exclude as well nodes that already appear in lower generations, as their branch has already been reduced.
     */
    $contributions_sum = DB::connection()->query()
        ->fromSub($root_contributions->unionAll($known_contributions), 'sosa_contribs')
        ->select(['sosa_contribs.gen', 'sosa_contribs.majs_gedcom_id', 'sosa_contribs.majs_user_id'])
        ->addSelect(['sosa_contribs.majs_i_id', 'sosa_contribs.contrib'])
        ->selectRaw('COUNT(' . $prefix . 'sosa_contribs.majs_i_id) * ' .
            $prefix . 'sosa_contribs.contrib AS totalContrib')
        ->leftJoin(
            'maj_sosa AS sosa_low',
            static function (JoinClause $join) use ($tree_id, $user_id): void {
                $join->on('sosa_low.majs_gen', '<', 'sosa_contribs.majs_gen')
                    ->on('sosa_low.majs_i_id', '=', 'sosa_contribs.majs_i_id')
                    ->where('sosa_low.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_low.majs_user_id', '=', $user_id);
            }
        )
        ->whereNull('sosa_low.majs_sosa')
        ->groupBy(['sosa_contribs.gen', 'sosa_contribs.majs_gedcom_id', 'sosa_contribs.majs_user_id',
            'sosa_contribs.majs_i_id', 'sosa_contribs.contrib']);

    // Aggregate all generation roots to compute root and generation pedigree collapse
    $collapse_rows = DB::connection()->query()->fromSub($contributions_sum, 'sosa_contribs_sum')
        ->select(['gen'])->selectRaw('SUM(contrib), SUM(totalContrib)')
        ->selectRaw('1 - SUM(contrib) / SUM(totalContrib) AS pedi_collapse_roots')  // Roots/horizontal collapse
        ->selectRaw('1 - SUM(totalContrib) / POWER ( 2, gen - 1) AS pedi_collapse_xgen') // Crossgeneration collapse
        ->groupBy(['gen', 'majs_gedcom_id', 'majs_user_id'])
        ->orderBy('gen')
        ->get();

    $collapse_by_generation = [];
    foreach ($collapse_rows as $collapse_row) {
        $collapse_by_generation[(int) $collapse_row->gen] = [
            'pedi_collapse_roots'   =>  (float) $collapse_row->pedi_collapse_roots,
            'pedi_collapse_xgen'    =>  (float) $collapse_row->pedi_collapse_xgen,
        ];
    }

    return $collapse_by_generation;
}
386
|
|
|
|
/**
 * Return a Collection of the mean generation depth and deviation for all Sosa ancestors at a given generation.
 * Sosa 1 is of generation 1.
 *
 * Mean generation depth and deviation are calculated based on the works of Marie-Hélène Cazes and Pierre Cazes,
 * published in Population (French Edition), Vol. 51, No. 1 (Jan. - Feb., 1996), pp. 117-140
 * http://kintip.net/index.php?option=com_jdownloads&task=download.send&id=9&catid=4&m=0
 *
 * An empty collection is returned when the database driver is not supported.
 *
 * Format:
 *  - key : sosa number of the ancestor
 *  - values:
 *      - root_ancestor_sosa : sosa number of the ancestor (same as key)
 *      - root_ancestor_id : ID of the ancestor
 *      - mean_gen_depth : Mean generation depth
 *      - stddev_gen_depth : Standard deviation of generation depth
 *
 * @param int $gen Sosa generation
 * @return Collection<int, \stdClass>
 */
public function generationDepthStatsAtGeneration(int $gen): Collection
{
    if (!$this->isPdoSupported()) {
        return collect();
    }

    $table_prefix = DB::connection()->getTablePrefix();

    /* For the Sosa of generation $gen and above with at least one parent missing, count by generation
     * (relative to $gen) and by root ancestor:
     *  - full_root_count: the Sosa with both parents missing
     *  - semi_root_count: the other ones, i.e. with exactly one parent missing
     * root_ancestor is computed from the Sosa number and its generation; it is later matched against
     * the Sosa numbers of the reference list to identify the ancestor at generation $gen.
     * POWER is used rather than its alias POW, which is not available on every database engine.
     */
    $missing_ancestors_by_gen = DB::table('maj_sosa AS sosa')
        ->selectRaw($table_prefix . 'sosa.majs_gen - ? AS majs_gen_norm', [$gen])
        ->selectRaw('FLOOR(((' . $table_prefix . 'sosa.majs_sosa / POWER(2, ' . $table_prefix . 'sosa.majs_gen -1 )) - 1) * POWER(2, ? - 1)) + POWER(2, ? - 1) AS root_ancestor', [$gen, $gen]) //@phpcs:ignore Generic.Files.LineLength.TooLong
        ->selectRaw('SUM(CASE WHEN ' . $table_prefix . 'sosa_fat.majs_i_id IS NULL AND ' . $table_prefix . 'sosa_mot.majs_i_id IS NULL THEN 1 ELSE 0 END) AS full_root_count') //@phpcs:ignore Generic.Files.LineLength.TooLong
        ->selectRaw('SUM(CASE WHEN ' . $table_prefix . 'sosa_fat.majs_i_id IS NULL AND ' . $table_prefix . 'sosa_mot.majs_i_id IS NULL THEN 0 ELSE 1 END) As semi_root_count') //@phpcs:ignore Generic.Files.LineLength.TooLong
        ->leftJoin('maj_sosa AS sosa_fat', function (JoinClause $join) use ($table_prefix): void {
            // Link to sosa's father
            $join->whereRaw($table_prefix . 'sosa_fat.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa')
                ->where('sosa_fat.majs_gedcom_id', '=', $this->tree->id())
                ->where('sosa_fat.majs_user_id', '=', $this->user->id());
        })
        ->leftJoin('maj_sosa AS sosa_mot', function (JoinClause $join) use ($table_prefix): void {
            // Link to sosa's mother
            $join->whereRaw($table_prefix . 'sosa_mot.majs_sosa = 2 * ' . $table_prefix . 'sosa.majs_sosa + 1')
                ->where('sosa_mot.majs_gedcom_id', '=', $this->tree->id())
                ->where('sosa_mot.majs_user_id', '=', $this->user->id());
        })
        ->where('sosa.majs_gedcom_id', '=', $this->tree->id())
        ->where('sosa.majs_user_id', '=', $this->user->id())
        ->where('sosa.majs_gen', '>=', $gen)
        ->where(function (Builder $query): void {
            // Keep only the Sosa with at least one parent missing
            $query->whereNull('sosa_fat.majs_i_id')
                ->orWhereNull('sosa_mot.majs_i_id');
        })
        ->groupBy(['sosa.majs_gen', 'root_ancestor']);

    // Aggregate the counts by root ancestor to compute the mean depth and its standard deviation
    return DB::table('maj_sosa AS sosa_list')
        ->select(['stats_by_gen.root_ancestor AS root_ancestor_sosa', 'sosa_list.majs_i_id as root_ancestor_id'])
        ->selectRaw('1 + SUM( (majs_gen_norm) * ( 2 * full_root_count + semi_root_count) / (2 * POWER(2, majs_gen_norm))) AS mean_gen_depth') //@phpcs:ignore Generic.Files.LineLength.TooLong
        ->selectRaw(' SQRT(' .
            ' SUM(POWER(majs_gen_norm, 2) * ( 2 * full_root_count + semi_root_count) / (2 * POWER(2, majs_gen_norm)))' . //@phpcs:ignore Generic.Files.LineLength.TooLong
            ' - POWER( SUM( (majs_gen_norm) * ( 2 * full_root_count + semi_root_count) / (2 * POWER(2, majs_gen_norm))), 2)' . //@phpcs:ignore Generic.Files.LineLength.TooLong
            ' ) AS stddev_gen_depth')
        ->joinSub($missing_ancestors_by_gen, 'stats_by_gen', function (JoinClause $join): void {
            $join->on('sosa_list.majs_sosa', '=', 'stats_by_gen.root_ancestor')
                ->where('sosa_list.majs_gedcom_id', '=', $this->tree->id())
                ->where('sosa_list.majs_user_id', '=', $this->user->id());
        })
        ->groupBy(['stats_by_gen.root_ancestor', 'sosa_list.majs_i_id'])
        ->orderBy('stats_by_gen.root_ancestor')
        ->get()->keyBy('root_ancestor_sosa');
}
454
|
|
|
|
/**
 * Return a collection of the most duplicated root Sosa ancestors.
 *
 * Root ancestors are the Sosa for which neither the father nor the mother is known as a Sosa.
 * Only the individuals appearing more than once are considered, the most duplicated first.
 *
 * The number of ancestors to return is limited by the parameter $limit.
 * One more row than requested is fetched: when it exists, all the individuals sharing its number
 * of duplications are removed, as they are tied when reaching the limit.
 * This means that there can be less individuals returned than requested.
 *
 * Format:
 *  - value:
 *      - sosa_i_id : sosa individual
 *      - sosa_count: number of duplications of the ancestor (e.g. 3 if it appears 3 times)
 *
 * @param int $limit
 * @return Collection<\stdClass>
 */
public function topMultipleAncestorsWithNoTies(int $limit): Collection
{
    $prefix = DB::connection()->getTablePrefix();
    $tree_id = $this->tree->id();
    $user_id = $this->user->id();

    // Number of Sosa numbers held by an individual
    $sosa_count_sql = 'COUNT(' . $prefix . 'sosa.majs_sosa)';

    $candidates = DB::table('maj_sosa AS sosa')
        ->select('sosa.majs_i_id AS sosa_i_id')
        ->selectRaw($sosa_count_sql . ' AS sosa_count')
        ->leftJoin(
            'maj_sosa AS sosa_fat',
            static function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // Father of a Sosa is 2 x Sosa
                $join->whereRaw($prefix . 'sosa_fat.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa')
                    ->where('sosa_fat.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_fat.majs_user_id', '=', $user_id);
            }
        )
        ->leftJoin(
            'maj_sosa AS sosa_mot',
            static function (JoinClause $join) use ($prefix, $tree_id, $user_id): void {
                // Mother of a Sosa is 2 x Sosa + 1
                $join->whereRaw($prefix . 'sosa_mot.majs_sosa = 2 * ' . $prefix . 'sosa.majs_sosa + 1')
                    ->where('sosa_mot.majs_gedcom_id', '=', $tree_id)
                    ->where('sosa_mot.majs_user_id', '=', $user_id);
            }
        )
        ->where('sosa.majs_gedcom_id', '=', $tree_id)
        ->where('sosa.majs_user_id', '=', $user_id)
        // Root individuals only: neither the father nor the mother is present
        ->whereNull('sosa_fat.majs_sosa')
        ->whereNull('sosa_mot.majs_sosa')
        ->groupBy('sosa.majs_i_id')
        // Duplicated individuals only
        ->havingRaw($sosa_count_sql . ' > 1')
        ->orderByRaw($sosa_count_sql . ' DESC, MIN(' . $prefix . 'sosa.majs_sosa) ASC')
        // One extra row is requested to detect ties at the limit
        ->limit($limit + 1)
        ->get();

    if ($candidates->count() <= $limit) {
        return $candidates;
    }

    $tied_count = $candidates->last()->sosa_count;

    return $candidates->filter(
        static fn (stdClass $candidate): bool => $candidate->sosa_count !== $tied_count
    );
}
505
|
|
|
|
/**
 * Return a computed array of statistics about the dispersion of ancestors across the ancestors
 * at a specified generation.
 *
 * An empty collection is returned when the database driver is not supported.
 *
 * Format:
 *  - key : rank of the ancestor in generation G for which exclusive ancestors have been found
 *          For instance 3 represent the maternal grand father
 *          0 is used for shared ancestors
 *  - values:
 *      - branches: same as key
 *      - majs_i_id: xref of the ancestor at rank key in generation G, or null for shared ancestors
 *      - count_indi: number of ancestors exclusively in the ancestors of the ancestor at rank key
 *
 * For instance a result at generation 3 could be :
 * [
 *   0 => { branches: 0, majs_i_id: null, count_indi: 12 } -> 12 ancestors are shared by the grand-parents
 *   1 => { branches: 1, majs_i_id: X2, count_indi: 32 } -> 32 ancestors are exclusive to the paternal grand-father
 *   2 => { branches: 2, majs_i_id: X3, count_indi: 25 } -> 25 ancestors are exclusive to the paternal grand-mother
 *   3 => { branches: 3, majs_i_id: X4, count_indi: 12 } -> 12 ancestors are exclusive to the maternal grand-father
 *   4 => { branches: 4, majs_i_id: X5, count_indi: 30 } -> 30 ancestors are exclusive to the maternal grand-mother
 * ]
 *
 * @param int $gen
 * @return Collection<int, \stdClass>
 */
public function ancestorsDispersionForGeneration(int $gen): Collection
{
    if (!$this->isPdoSupported()) {
        return collect();
    }

    /* List the distinct (individual, branch) pairs for the Sosa of generation $gen and above.
     * The branch is the 1-based rank, within generation $gen, obtained by truncating the Sosa number
     * by the generation gap. POWER is used rather than its alias POW, which is not available
     * on every database engine.
     */
    $ancestors_branches = DB::table('maj_sosa')
        ->select('majs_i_id AS i_id')
        ->selectRaw('FLOOR(majs_sosa / POWER(2, (majs_gen - ?))) - POWER(2, ? -1) + 1 AS branch', [$gen, $gen])
        ->where('majs_gedcom_id', '=', $this->tree->id())
        ->where('majs_user_id', '=', $this->user->id())
        ->where('majs_gen', '>=', $gen)
        ->groupBy('majs_i_id', 'branch');

    // Individuals found in several branches are consolidated under the shared branch 0
    $consolidated_ancestors_branches = DB::table('maj_sosa')
        ->fromSub($ancestors_branches, 'indi_branch')
        ->select('i_id')
        ->selectRaw('CASE WHEN COUNT(branch) > 1 THEN 0 ELSE MIN(branch) END AS branches')
        ->groupBy('i_id');

    /* Count the individuals by branch, and attach the Sosa row of the ancestor heading the branch.
     * The right join keeps the shared branch 0, which has no heading ancestor: its majs_i_id is null.
     */
    return DB::table('maj_sosa')
        ->rightJoinSub(
            $consolidated_ancestors_branches,
            'indi_branch_consolidated',
            function (JoinClause $join) use ($gen): void {
                $join->where('maj_sosa.majs_gedcom_id', '=', $this->tree->id())
                    ->where('maj_sosa.majs_user_id', '=', $this->user->id())
                    ->where('branches', '>', 0)
                    ->whereRaw('majs_sosa = POWER(2, ? - 1) + branches - 1', [$gen]);
            }
        )
        ->select(['branches', 'majs_i_id'])
        ->selectRaw('COUNT(i_id) AS count_indi')
        ->groupBy(['branches', 'majs_i_id'])
        ->get()->keyBy('branches');
}
567
|
|
|
} |
568
|
|
|
|