xref: /webtrees/app/Services/SearchService.php (revision 1792ff1cf1956b41f3e3c853cfb279a803a71ed2)
1<?php
2
3/**
4 * webtrees: online genealogy
5 * Copyright (C) 2019 webtrees development team
6 * This program is free software: you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License as published by
8 * the Free Software Foundation, either version 3 of the License, or
9 * (at your option) any later version.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program. If not, see <http://www.gnu.org/licenses/>.
16 */
17
18declare(strict_types=1);
19
20namespace Fisharebest\Webtrees\Services;
21
22use Closure;
23use Fisharebest\Webtrees\Date;
24use Fisharebest\Webtrees\Exceptions\HttpServiceUnavailableException;
25use Fisharebest\Webtrees\Family;
26use Fisharebest\Webtrees\Gedcom;
27use Fisharebest\Webtrees\GedcomRecord;
28use Fisharebest\Webtrees\I18N;
29use Fisharebest\Webtrees\Individual;
30use Fisharebest\Webtrees\Media;
31use Fisharebest\Webtrees\Note;
32use Fisharebest\Webtrees\Place;
33use Fisharebest\Webtrees\Repository;
34use Fisharebest\Webtrees\Soundex;
35use Fisharebest\Webtrees\Source;
36use Fisharebest\Webtrees\Submitter;
37use Fisharebest\Webtrees\Tree;
38use Illuminate\Database\Capsule\Manager as DB;
39use Illuminate\Database\Query\Builder;
40use Illuminate\Database\Query\Expression;
41use Illuminate\Database\Query\JoinClause;
42use Illuminate\Support\Collection;
43use stdClass;
44
45use function mb_stripos;
46
47/**
48 * Search trees for genealogy records.
49 */
50class SearchService
51{
52    /** @var TreeService */
53    private $tree_service;
54
55    /**
56     * SearchService constructor.
57     *
58     * @param TreeService $tree_service
59     */
60    public function __construct(TreeService $tree_service)
61    {
62        $this->tree_service = $tree_service;
63    }
64
65    /**
66     * @param Tree[]   $trees
67     * @param string[] $search
68     *
69     * @return Collection<Family>
70     */
71    public function searchFamilies(array $trees, array $search): Collection
72    {
73        $query = DB::table('families');
74
75        $this->whereTrees($query, 'f_file', $trees);
76        $this->whereSearch($query, 'f_gedcom', $search);
77
78        return $query
79            ->get()
80            ->each($this->rowLimiter())
81            ->map($this->familyRowMapper())
82            ->filter(GedcomRecord::accessFilter())
83            ->filter($this->rawGedcomFilter($search));
84    }
85
86    /**
87     * Search for families by name.
88     *
89     * @param Tree[]   $trees
90     * @param string[] $search
91     * @param int      $offset
92     * @param int      $limit
93     *
94     * @return Collection<Family>
95     */
96    public function searchFamilyNames(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
97    {
98        $query = DB::table('families')
99            ->leftJoin('name AS husb_name', static function (JoinClause $join): void {
100                $join
101                    ->on('husb_name.n_file', '=', 'families.f_file')
102                    ->on('husb_name.n_id', '=', 'families.f_husb')
103                    ->where('husb_name.n_type', '<>', '_MARNM');
104            })
105            ->leftJoin('name AS wife_name', static function (JoinClause $join): void {
106                $join
107                    ->on('wife_name.n_file', '=', 'families.f_file')
108                    ->on('wife_name.n_id', '=', 'families.f_wife')
109                    ->where('wife_name.n_type', '<>', '_MARNM');
110            });
111
112        $prefix = DB::connection()->getTablePrefix();
113        $field  = new Expression('COALESCE(' . $prefix . "husb_name.n_full, '') || COALESCE(" . $prefix . "wife_name.n_full, '')");
114
115        $this->whereTrees($query, 'f_file', $trees);
116        $this->whereSearch($query, $field, $search);
117
118        $query
119            ->orderBy('husb_name.n_sort')
120            ->orderBy('wife_name.n_sort')
121            ->select(['families.*', 'husb_name.n_sort', 'wife_name.n_sort'])
122            ->distinct();
123
124        return $this->paginateQuery($query, $this->familyRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
125    }
126
127    /**
128     * @param Tree[]   $trees
129     * @param string[] $search
130     *
131     * @return Collection<Individual>
132     */
133    public function searchIndividuals(array $trees, array $search): Collection
134    {
135        $query = DB::table('individuals');
136
137        $this->whereTrees($query, 'i_file', $trees);
138        $this->whereSearch($query, 'i_gedcom', $search);
139
140        return $query
141            ->get()
142            ->each($this->rowLimiter())
143            ->map($this->individualRowMapper())
144            ->filter(GedcomRecord::accessFilter())
145            ->filter($this->rawGedcomFilter($search));
146    }
147
148    /**
149     * Search for individuals by name.
150     *
151     * @param Tree[]   $trees
152     * @param string[] $search
153     * @param int      $offset
154     * @param int      $limit
155     *
156     * @return Collection<Individual>
157     */
158    public function searchIndividualNames(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
159    {
160        $query = DB::table('individuals')
161            ->join('name', static function (JoinClause $join): void {
162                $join
163                    ->on('name.n_file', '=', 'individuals.i_file')
164                    ->on('name.n_id', '=', 'individuals.i_id');
165            })
166            ->orderBy('n_sort')
167            ->distinct()
168            ->select(['individuals.*', 'n_sort']);
169
170        $this->whereTrees($query, 'i_file', $trees);
171        $this->whereSearch($query, 'n_full', $search);
172
173        return $this->paginateQuery($query, $this->individualRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
174    }
175
176    /**
177     * Search for media objects.
178     *
179     * @param Tree[]   $trees
180     * @param string[] $search
181     * @param int      $offset
182     * @param int      $limit
183     *
184     * @return Collection<Media>
185     */
186    public function searchMedia(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
187    {
188        $query = DB::table('media');
189
190        $this->whereTrees($query, 'media.m_file', $trees);
191        $this->whereSearch($query, 'm_gedcom', $search);
192
193        return $this->paginateQuery($query, $this->mediaRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
194    }
195
196    /**
197     * Search for notes.
198     *
199     * @param Tree[]   $trees
200     * @param string[] $search
201     * @param int      $offset
202     * @param int      $limit
203     *
204     * @return Collection<Note>
205     */
206    public function searchNotes(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
207    {
208        $query = DB::table('other')
209            ->where('o_type', '=', 'NOTE');
210
211        $this->whereTrees($query, 'o_file', $trees);
212        $this->whereSearch($query, 'o_gedcom', $search);
213
214        return $this->paginateQuery($query, $this->noteRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
215    }
216
217    /**
218     * Search for repositories.
219     *
220     * @param Tree[]   $trees
221     * @param string[] $search
222     * @param int      $offset
223     * @param int      $limit
224     *
225     * @return Collection<Repository>
226     */
227    public function searchRepositories(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
228    {
229        $query = DB::table('other')
230            ->where('o_type', '=', 'REPO');
231
232        $this->whereTrees($query, 'o_file', $trees);
233        $this->whereSearch($query, 'o_gedcom', $search);
234
235        return $this->paginateQuery($query, $this->repositoryRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
236    }
237
238    /**
239     * Search for sources.
240     *
241     * @param Tree[]   $trees
242     * @param string[] $search
243     * @param int      $offset
244     * @param int      $limit
245     *
246     * @return Collection<Source>
247     */
248    public function searchSources(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
249    {
250        $query = DB::table('sources');
251
252        $this->whereTrees($query, 's_file', $trees);
253        $this->whereSearch($query, 's_gedcom', $search);
254
255        return $this->paginateQuery($query, $this->sourceRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
256    }
257
258    /**
259     * Search for sources by name.
260     *
261     * @param Tree[]   $trees
262     * @param string[] $search
263     * @param int      $offset
264     * @param int      $limit
265     *
266     * @return Collection<Source>
267     */
268    public function searchSourcesByName(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
269    {
270        $query = DB::table('sources')
271            ->orderBy('s_name');
272
273        $this->whereTrees($query, 's_file', $trees);
274        $this->whereSearch($query, 's_name', $search);
275
276        return $this->paginateQuery($query, $this->sourceRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
277    }
278
279    /**
280     * Search for submitters.
281     *
282     * @param Tree[]   $trees
283     * @param string[] $search
284     * @param int      $offset
285     * @param int      $limit
286     *
287     * @return Collection<Submitter>
288     */
289    public function searchSubmitters(array $trees, array $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
290    {
291        $query = DB::table('other')
292            ->where('o_type', '=', 'SUBM');
293
294        $this->whereTrees($query, 'o_file', $trees);
295        $this->whereSearch($query, 'o_gedcom', $search);
296
297        return $this->paginateQuery($query, $this->submitterRowMapper(), GedcomRecord::accessFilter(), $offset, $limit);
298    }
299
300    /**
301     * Search for places.
302     *
303     * @param Tree   $tree
304     * @param string $search
305     * @param int    $offset
306     * @param int    $limit
307     *
308     * @return Collection<Place>
309     */
310    public function searchPlaces(Tree $tree, string $search, int $offset = 0, int $limit = PHP_INT_MAX): Collection
311    {
312        $query = DB::table('places AS p0')
313            ->where('p0.p_file', '=', $tree->id())
314            ->leftJoin('places AS p1', 'p1.p_id', '=', 'p0.p_parent_id')
315            ->leftJoin('places AS p2', 'p2.p_id', '=', 'p1.p_parent_id')
316            ->leftJoin('places AS p3', 'p3.p_id', '=', 'p2.p_parent_id')
317            ->leftJoin('places AS p4', 'p4.p_id', '=', 'p3.p_parent_id')
318            ->leftJoin('places AS p5', 'p5.p_id', '=', 'p4.p_parent_id')
319            ->leftJoin('places AS p6', 'p6.p_id', '=', 'p5.p_parent_id')
320            ->leftJoin('places AS p7', 'p7.p_id', '=', 'p6.p_parent_id')
321            ->leftJoin('places AS p8', 'p8.p_id', '=', 'p7.p_parent_id')
322            ->orderBy('p0.p_place')
323            ->orderBy('p1.p_place')
324            ->orderBy('p2.p_place')
325            ->orderBy('p3.p_place')
326            ->orderBy('p4.p_place')
327            ->orderBy('p5.p_place')
328            ->orderBy('p6.p_place')
329            ->orderBy('p7.p_place')
330            ->orderBy('p8.p_place')
331            ->select([
332                'p0.p_place AS place0',
333                'p1.p_place AS place1',
334                'p2.p_place AS place2',
335                'p3.p_place AS place3',
336                'p4.p_place AS place4',
337                'p5.p_place AS place5',
338                'p6.p_place AS place6',
339                'p7.p_place AS place7',
340                'p8.p_place AS place8',
341            ]);
342
343        // Filter each level of the hierarchy.
344        foreach (explode(',', $search, 9) as $level => $string) {
345            $query->whereContains('p' . $level . '.p_place', $string);
346        }
347
348        $row_mapper = static function (stdClass $row) use ($tree): Place {
349            $place = implode(', ', array_filter((array) $row));
350
351            return new Place($place, $tree);
352        };
353
354        $filter = static function (): bool {
355            return true;
356        };
357
358        return $this->paginateQuery($query, $row_mapper, $filter, $offset, $limit);
359    }
360
361    /**
362     * @param Tree[]   $trees
363     * @param string[] $fields
364     * @param string[] $modifiers
365     *
366     * @return Collection<Individual>
367     */
368    public function searchIndividualsAdvanced(array $trees, array $fields, array $modifiers): Collection
369    {
370        $fields = array_filter($fields);
371
372        $query = DB::table('individuals')
373            ->select(['individuals.*'])
374            ->distinct();
375
376        $this->whereTrees($query, 'i_file', $trees);
377
378        // Join the following tables
379        $father_name   = false;
380        $mother_name   = false;
381        $spouse_family = false;
382        $indi_name     = false;
383        $indi_date     = false;
384        $fam_date      = false;
385        $indi_plac     = false;
386        $fam_plac      = false;
387
388        foreach ($fields as $field_name => $field_value) {
389            if ($field_value !== '') {
390                if (substr($field_name, 0, 14) === 'FAMC:HUSB:NAME') {
391                    $father_name = true;
392                } elseif (substr($field_name, 0, 14) === 'FAMC:WIFE:NAME') {
393                    $mother_name = true;
394                } elseif (substr($field_name, 0, 4) === 'NAME') {
395                    $indi_name = true;
396                } elseif (strpos($field_name, ':DATE') !== false) {
397                    if (substr($field_name, 0, 4) === 'FAMS') {
398                        $fam_date      = true;
399                        $spouse_family = true;
400                    } else {
401                        $indi_date = true;
402                    }
403                } elseif (strpos($field_name, ':PLAC') !== false) {
404                    if (substr($field_name, 0, 4) === 'FAMS') {
405                        $fam_plac      = true;
406                        $spouse_family = true;
407                    } else {
408                        $indi_plac = true;
409                    }
410                } elseif ($field_name === 'FAMS:NOTE') {
411                    $spouse_family = true;
412                }
413            }
414        }
415
416        if ($father_name || $mother_name) {
417            $query->join('link AS l1', static function (JoinClause $join): void {
418                $join
419                    ->on('l1.l_file', '=', 'individuals.i_file')
420                    ->on('l1.l_from', '=', 'individuals.i_id')
421                    ->where('l1.l_type', '=', 'FAMC');
422            });
423
424            if ($father_name) {
425                $query->join('link AS l2', static function (JoinClause $join): void {
426                    $join
427                        ->on('l2.l_file', '=', 'l1.l_file')
428                        ->on('l2.l_from', '=', 'l1.l_to')
429                        ->where('l2.l_type', '=', 'HUSB');
430                });
431                $query->join('name AS father_name', static function (JoinClause $join): void {
432                    $join
433                        ->on('father_name.n_file', '=', 'l2.l_file')
434                        ->on('father_name.n_id', '=', 'l2.l_to');
435                });
436            }
437
438            if ($mother_name) {
439                $query->join('link AS l3', static function (JoinClause $join): void {
440                    $join
441                        ->on('l3.l_file', '=', 'l1.l_file')
442                        ->on('l3.l_from', '=', 'l1.l_to')
443                        ->where('l3.l_type', '=', 'WIFE');
444                });
445                $query->join('name AS mother_name', static function (JoinClause $join): void {
446                    $join
447                        ->on('mother_name.n_file', '=', 'l3.l_file')
448                        ->on('mother_name.n_id', '=', 'l3.l_to');
449                });
450            }
451        }
452
453        if ($spouse_family) {
454            $query->join('link AS l4', static function (JoinClause $join): void {
455                $join
456                    ->on('l4.l_file', '=', 'individuals.i_file')
457                    ->on('l4.l_from', '=', 'individuals.i_id')
458                    ->where('l4.l_type', '=', 'FAMS');
459            });
460            $query->join('families AS spouse_families', static function (JoinClause $join): void {
461                $join
462                    ->on('spouse_families.f_file', '=', 'l4.l_file')
463                    ->on('spouse_families.f_id', '=', 'l4.l_to');
464            });
465        }
466
467        if ($indi_name) {
468            $query->join('name AS individual_name', static function (JoinClause $join): void {
469                $join
470                    ->on('individual_name.n_file', '=', 'individuals.i_file')
471                    ->on('individual_name.n_id', '=', 'individuals.i_id');
472            });
473        }
474
475        if ($indi_date) {
476            $query->join('dates AS individual_dates', static function (JoinClause $join): void {
477                $join
478                    ->on('individual_dates.d_file', '=', 'individuals.i_file')
479                    ->on('individual_dates.d_gid', '=', 'individuals.i_id');
480            });
481        }
482
483        if ($fam_date) {
484            $query->join('dates AS family_dates', static function (JoinClause $join): void {
485                $join
486                    ->on('family_dates.d_file', '=', 'spouse_families.f_file')
487                    ->on('family_dates.d_gid', '=', 'spouse_families.f_id');
488            });
489        }
490
491        if ($indi_plac) {
492            $query->join('placelinks AS individual_placelinks', static function (JoinClause $join): void {
493                $join
494                    ->on('individual_placelinks.pl_file', '=', 'individuals.i_file')
495                    ->on('individual_placelinks.pl_gid', '=', 'individuals.i_id');
496            });
497            $query->join('places AS individual_places', static function (JoinClause $join): void {
498                $join
499                    ->on('individual_places.p_file', '=', 'individual_placelinks.pl_file')
500                    ->on('individual_places.p_id', '=', 'individual_placelinks.pl_p_id');
501            });
502        }
503
504        if ($fam_plac) {
505            $query->join('placelinks AS familyl_placelinks', static function (JoinClause $join): void {
506                $join
507                    ->on('familyl_placelinks.pl_file', '=', 'individuals.i_file')
508                    ->on('familyl_placelinks.pl_gid', '=', 'individuals.i_id');
509            });
510            $query->join('places AS family_places', static function (JoinClause $join): void {
511                $join
512                    ->on('family_places.p_file', '=', 'familyl_placelinks.pl_file')
513                    ->on('family_places.p_id', '=', 'familyl_placelinks.pl_p_id');
514            });
515        }
516
517        foreach ($fields as $field_name => $field_value) {
518            $parts = explode(':', $field_name . '::::');
519            if ($parts[0] === 'NAME') {
520                // NAME:*
521                switch ($parts[1]) {
522                    case 'GIVN':
523                        switch ($modifiers[$field_name]) {
524                            case 'EXACT':
525                                $query->where('individual_name.n_givn', '=', $field_value);
526                                break;
527                            case 'BEGINS':
528                                $query->where('individual_name.n_givn', 'LIKE', $field_value . '%');
529                                break;
530                            case 'CONTAINS':
531                                $query->where('individual_name.n_givn', 'LIKE', '%' . $field_value . '%');
532                                break;
533                            case 'SDX_STD':
534                                $sdx = Soundex::russell($field_value);
535                                if ($sdx !== '') {
536                                    $this->wherePhonetic($query, 'individual_name.n_soundex_givn_std', $sdx);
537                                } else {
538                                    // No phonetic content? Use a substring match
539                                    $query->where('individual_name.n_givn', 'LIKE', '%' . $field_value . '%');
540                                }
541                                break;
542                            case 'SDX': // SDX uses DM by default.
543                            case 'SDX_DM':
544                                $sdx = Soundex::daitchMokotoff($field_value);
545                                if ($sdx !== '') {
546                                    $this->wherePhonetic($query, 'individual_name.n_soundex_givn_dm', $sdx);
547                                } else {
548                                    // No phonetic content? Use a substring match
549                                    $query->where('individual_name.n_givn', 'LIKE', '%' . $field_value . '%');
550                                }
551                                break;
552                        }
553                        break;
554                    case 'SURN':
555                        switch ($modifiers[$field_name]) {
556                            case 'EXACT':
557                                $query->where('individual_name.n_surn', '=', $field_value);
558                                break;
559                            case 'BEGINS':
560                                $query->where('individual_name.n_surn', 'LIKE', $field_value . '%');
561                                break;
562                            case 'CONTAINS':
563                                $query->where('individual_name.n_surn', 'LIKE', '%' . $field_value . '%');
564                                break;
565                            case 'SDX_STD':
566                                $sdx = Soundex::russell($field_value);
567                                if ($sdx !== '') {
568                                    $this->wherePhonetic($query, 'individual_name.n_soundex_surn_std', $sdx);
569                                } else {
570                                    // No phonetic content? Use a substring match
571                                    $query->where('individual_name.n_surn', 'LIKE', '%' . $field_value . '%');
572                                }
573                                break;
574                            case 'SDX': // SDX uses DM by default.
575                            case 'SDX_DM':
576                                $sdx = Soundex::daitchMokotoff($field_value);
577                                if ($sdx !== '') {
578                                    $this->wherePhonetic($query, 'individual_name.n_soundex_surn_dm', $sdx);
579                                } else {
580                                    // No phonetic content? Use a substring match
581                                    $query->where('individual_name.n_surn', 'LIKE', '%' . $field_value . '%');
582                                }
583                                break;
584                        }
585                        break;
586                    case 'NICK':
587                    case '_MARNM':
588                    case '_HEB':
589                    case '_AKA':
590                        $query
591                            ->where('individual_name', '=', $parts[1])
592                            ->where('individual_name', 'LIKE', '%' . $field_value . '%');
593                        break;
594                }
595                unset($fields[$field_name]);
596            } elseif ($parts[1] === 'DATE') {
597                // *:DATE
598                $date = new Date($field_value);
599                if ($date->isOK()) {
600                    $delta = 365 * ($modifiers[$field_name] ?? 0);
601                    $query
602                        ->where('individual_dates.d_fact', '=', $parts[0])
603                        ->where('individual_dates.d_julianday1', '>=', $date->minimumJulianDay() - $delta)
604                        ->where('individual_dates.d_julianday2', '<=', $date->minimumJulianDay() + $delta);
605                }
606                unset($fields[$field_name]);
607            } elseif ($parts[0] === 'FAMS' && $parts[2] === 'DATE') {
608                // FAMS:*:DATE
609                $date = new Date($field_value);
610                if ($date->isOK()) {
611                    $delta = 365 * $modifiers[$field_name];
612                    $query
613                        ->where('family_dates.d_fact', '=', $parts[1])
614                        ->where('family_dates.d_julianday1', '>=', $date->minimumJulianDay() - $delta)
615                        ->where('family_dates.d_julianday2', '<=', $date->minimumJulianDay() + $delta);
616                }
617                unset($fields[$field_name]);
618            } elseif ($parts[1] === 'PLAC') {
619                // *:PLAC
620                // SQL can only link a place to a person/family, not to an event.
621                $query->where('individual_places.p_place', 'LIKE', '%' . $field_value . '%');
622            } elseif ($parts[0] === 'FAMS' && $parts[2] === 'PLAC') {
623                // FAMS:*:PLAC
624                // SQL can only link a place to a person/family, not to an event.
625                $query->where('family_places.p_place', 'LIKE', '%' . $field_value . '%');
626            } elseif ($parts[0] === 'FAMC' && $parts[2] === 'NAME') {
627                $table = $parts[1] === 'HUSB' ? 'father_name' : 'mother_name';
628                // NAME:*
629                switch ($parts[3]) {
630                    case 'GIVN':
631                        switch ($modifiers[$field_name]) {
632                            case 'EXACT':
633                                $query->where($table . '.n_givn', '=', $field_value);
634                                break;
635                            case 'BEGINS':
636                                $query->where($table . '.n_givn', 'LIKE', $field_value . '%');
637                                break;
638                            case 'CONTAINS':
639                                $query->where($table . '.n_givn', 'LIKE', '%' . $field_value . '%');
640                                break;
641                            case 'SDX_STD':
642                                $sdx = Soundex::russell($field_value);
643                                if ($sdx !== '') {
644                                    $this->wherePhonetic($query, $table . '.n_soundex_givn_std', $sdx);
645                                } else {
646                                    // No phonetic content? Use a substring match
647                                    $query->where($table . '.n_givn', 'LIKE', '%' . $field_value . '%');
648                                }
649                                break;
650                            case 'SDX': // SDX uses DM by default.
651                            case 'SDX_DM':
652                                $sdx = Soundex::daitchMokotoff($field_value);
653                                if ($sdx !== '') {
654                                    $this->wherePhonetic($query, $table . '.n_soundex_givn_dm', $sdx);
655                                } else {
656                                    // No phonetic content? Use a substring match
657                                    $query->where($table . '.n_givn', 'LIKE', '%' . $field_value . '%');
658                                }
659                                break;
660                        }
661                        break;
662                    case 'SURN':
663                        switch ($modifiers[$field_name]) {
664                            case 'EXACT':
665                                $query->where($table . '.n_surn', '=', $field_value);
666                                break;
667                            case 'BEGINS':
668                                $query->where($table . '.n_surn', 'LIKE', $field_value . '%');
669                                break;
670                            case 'CONTAINS':
671                                $query->where($table . '.n_surn', 'LIKE', '%' . $field_value . '%');
672                                break;
673                            case 'SDX_STD':
674                                $sdx = Soundex::russell($field_value);
675                                if ($sdx !== '') {
676                                    $this->wherePhonetic($query, $table . '.n_soundex_surn_std', $sdx);
677                                } else {
678                                    // No phonetic content? Use a substring match
679                                    $query->where($table . '.n_surn', 'LIKE', '%' . $field_value . '%');
680                                }
681                                break;
682                            case 'SDX': // SDX uses DM by default.
683                            case 'SDX_DM':
684                                $sdx = Soundex::daitchMokotoff($field_value);
685                                if ($sdx !== '') {
686                                    $this->wherePhonetic($query, $table . '.n_soundex_surn_dm', $sdx);
687                                } else {
688                                    // No phonetic content? Use a substring match
689                                    $query->where($table . '.n_surn', 'LIKE', '%' . $field_value . '%');
690                                }
691                                break;
692                        }
693                        break;
694                }
695                unset($fields[$field_name]);
696            } elseif ($parts[0] === 'FAMS') {
697                // e.g. searches for occupation, religion, note, etc.
698                // Initial matching only.  Need PHP to apply filter.
699                $query->where('spouse_families.f_gedcom', 'LIKE', "%\n1 " . $parts[1] . ' %' . $field_value . '%');
700            } elseif ($parts[1] === 'TYPE') {
701                // e.g. FACT:TYPE or EVEN:TYPE
702                // Initial matching only.  Need PHP to apply filter.
703                $query->where('individuals.i_gedcom', 'LIKE', "%\n1 " . $parts[0] . '%\n2 TYPE %' . $field_value . '%');
704            } else {
705                // e.g. searches for occupation, religion, note, etc.
706                // Initial matching only.  Need PHP to apply filter.
707                $query->where('individuals.i_gedcom', 'LIKE', "%\n1 " . $parts[0] . '%' . $parts[1] . '%' . $field_value . '%');
708            }
709        }
710        return $query
711            ->get()
712            ->each($this->rowLimiter())
713            ->map($this->individualRowMapper())
714            ->filter(GedcomRecord::accessFilter())
715            ->filter(static function (Individual $individual) use ($fields): bool {
716                // Check for searches which were only partially matched by SQL
717                foreach ($fields as $field_name => $field_value) {
718                    $regex = '/' . preg_quote($field_value, '/') . '/i';
719
720                    $parts = explode(':', $field_name . '::::');
721
722                    // *:PLAC
723                    if ($parts[1] === 'PLAC') {
724                        foreach ($individual->facts([$parts[0]]) as $fact) {
725                            if (preg_match($regex, $fact->place()->gedcomName())) {
726                                continue 2;
727                            }
728                        }
729                        return false;
730                    }
731
732                    // FAMS:*:PLAC
733                    if ($parts[0] === 'FAMS' && $parts[2] === 'PLAC') {
734                        foreach ($individual->spouseFamilies() as $family) {
735                            foreach ($family->facts([$parts[1]]) as $fact) {
736                                if (preg_match($regex, $fact->place()->gedcomName())) {
737                                    continue 2;
738                                }
739                            }
740                        }
741                        return false;
742                    }
743
744                    // e.g. searches for occupation, religion, note, etc.
745                    if ($parts[0] === 'FAMS') {
746                        foreach ($individual->spouseFamilies() as $family) {
747                            foreach ($family->facts([$parts[1]]) as $fact) {
748                                if (preg_match($regex, $fact->value())) {
749                                    continue 3;
750                                }
751                            }
752                        }
753                        return false;
754                    }
755
756                    // e.g. FACT:TYPE or EVEN:TYPE
757                    if ($parts[1] === 'TYPE' || $parts[1] === '_WT_USER') {
758                        foreach ($individual->facts([$parts[0]]) as $fact) {
759                            if (preg_match($regex, $fact->attribute($parts[1]))) {
760                                continue 2;
761                            }
762                        }
763
764                        return false;
765                    }
766                }
767
768                return true;
769            });
770    }
771
772    /**
773     * @param string $soundex
774     * @param string $lastname
775     * @param string $firstname
776     * @param string $place
777     * @param Tree[] $search_trees
778     *
779     * @return Collection<Individual>
780     */
781    public function searchIndividualsPhonetic(string $soundex, string $lastname, string $firstname, string $place, array $search_trees): Collection
782    {
783        switch ($soundex) {
784            default:
785            case 'Russell':
786                $givn_sdx   = Soundex::russell($firstname);
787                $surn_sdx   = Soundex::russell($lastname);
788                $plac_sdx   = Soundex::russell($place);
789                $givn_field = 'n_soundex_givn_std';
790                $surn_field = 'n_soundex_surn_std';
791                $plac_field = 'p_std_soundex';
792                break;
793            case 'DaitchM':
794                $givn_sdx   = Soundex::daitchMokotoff($firstname);
795                $surn_sdx   = Soundex::daitchMokotoff($lastname);
796                $plac_sdx   = Soundex::daitchMokotoff($place);
797                $givn_field = 'n_soundex_givn_dm';
798                $surn_field = 'n_soundex_surn_dm';
799                $plac_field = 'p_dm_soundex';
800                break;
801        }
802
803        // Nothing to search for? Return nothing.
804        if ($givn_sdx === '' && $surn_sdx === '' && $plac_sdx === '') {
805            return new Collection();
806        }
807
808        $query = DB::table('individuals')
809            ->select(['individuals.*'])
810            ->distinct();
811
812        $this->whereTrees($query, 'i_file', $search_trees);
813
814        if ($plac_sdx !== '') {
815            $query->join('placelinks', static function (JoinClause $join): void {
816                $join
817                    ->on('placelinks.pl_file', '=', 'individuals.i_file')
818                    ->on('placelinks.pl_gid', '=', 'individuals.i_id');
819            });
820            $query->join('places', static function (JoinClause $join): void {
821                $join
822                    ->on('places.p_file', '=', 'placelinks.pl_file')
823                    ->on('places.p_id', '=', 'placelinks.pl_p_id');
824            });
825
826            $this->wherePhonetic($query, $plac_field, $plac_sdx);
827        }
828
829        if ($givn_sdx !== '' || $surn_sdx !== '') {
830            $query->join('name', static function (JoinClause $join): void {
831                $join
832                    ->on('name.n_file', '=', 'individuals.i_file')
833                    ->on('name.n_id', '=', 'individuals.i_id');
834            });
835
836            $this->wherePhonetic($query, $givn_field, $givn_sdx);
837            $this->wherePhonetic($query, $surn_field, $surn_sdx);
838        }
839
840        return $query
841            ->get()
842            ->each($this->rowLimiter())
843            ->map($this->individualRowMapper())
844            ->filter(GedcomRecord::accessFilter());
845    }
846
847    /**
848     * Paginate a search query.
849     *
850     * @param Builder $query      Searches the database for the desired records.
851     * @param Closure $row_mapper Converts a row from the query into a record.
852     * @param Closure $row_filter
853     * @param int     $offset     Skip this many rows.
854     * @param int     $limit      Take this many rows.
855     *
856     * @return Collection<mixed>
857     */
858    private function paginateQuery(Builder $query, Closure $row_mapper, Closure $row_filter, int $offset, int $limit): Collection
859    {
860        $collection = new Collection();
861
862        foreach ($query->cursor() as $row) {
863            $record = $row_mapper($row);
864            // If the object has a method "canShow()", then use it to filter for privacy.
865            if ($row_filter($record)) {
866                if ($offset > 0) {
867                    $offset--;
868                } else {
869                    if ($limit > 0) {
870                        $collection->push($record);
871                    }
872
873                    $limit--;
874
875                    if ($limit === 0) {
876                        break;
877                    }
878                }
879            }
880        }
881
882
883        return $collection;
884    }
885
886    /**
887     * Apply search filters to a SQL query column.  Apply collation rules to MySQL.
888     *
889     * @param Builder           $query
890     * @param Expression|string $field
891     * @param string[]          $search_terms
892     */
893    private function whereSearch(Builder $query, $field, array $search_terms): void
894    {
895        if ($field instanceof Expression) {
896            $field = $field->getValue();
897        }
898
899        foreach ($search_terms as $search_term) {
900            $query->whereContains(new Expression($field), $search_term);
901        }
902    }
903
904    /**
905     * Apply soundex search filters to a SQL query column.
906     *
907     * @param Builder           $query
908     * @param Expression|string $field
909     * @param string            $soundex
910     */
911    private function wherePhonetic(Builder $query, $field, string $soundex): void
912    {
913        if ($soundex !== '') {
914            $query->where(static function (Builder $query) use ($soundex, $field): void {
915                foreach (explode(':', $soundex) as $sdx) {
916                    $query->orWhere($field, 'LIKE', '%' . $sdx . '%');
917                }
918            });
919        }
920    }
921
922    /**
923     * @param Builder $query
924     * @param string  $tree_id_field
925     * @param Tree[]  $trees
926     */
927    private function whereTrees(Builder $query, string $tree_id_field, array $trees): void
928    {
929        $tree_ids = array_map(static function (Tree $tree): int {
930            return $tree->id();
931        }, $trees);
932
933        $query->whereIn($tree_id_field, $tree_ids);
934    }
935
936
937    /**
938     * Find the media object that uses a particular media file.
939     *
940     * @param string $file
941     *
942     * @return Media[]
943     */
944    public function findMediaObjectsForMediaFile(string $file): array
945    {
946        return DB::table('media')
947            ->join('media_file', static function (JoinClause $join): void {
948                $join
949                    ->on('media_file.m_file', '=', 'media.m_file')
950                    ->on('media_file.m_id', '=', 'media.m_id');
951            })
952            ->join('gedcom_setting', 'media.m_file', '=', 'gedcom_setting.gedcom_id')
953            ->where(new Expression('setting_value || multimedia_file_refn'), '=', $file)
954            ->select(['media.*'])
955            ->distinct()
956            ->get()
957            ->map($this->mediaRowMapper())
958            ->all();
959    }
960
961    /**
962     * A closure to filter records by privacy-filtered GEDCOM data.
963     *
964     * @param array $search_terms
965     *
966     * @return Closure
967     */
968    private function rawGedcomFilter(array $search_terms): Closure
969    {
970        return static function (GedcomRecord $record) use ($search_terms): bool {
971            // Ignore non-genealogy fields
972            $gedcom = preg_replace('/\n\d (?:_UID|_WT_USER) .*/', '', $record->gedcom());
973
974            // Ignore matches in links
975            $gedcom = preg_replace('/\n\d ' . Gedcom::REGEX_TAG . '( @' . Gedcom::REGEX_XREF . '@)?/', '', $gedcom);
976
977            // Re-apply the filtering
978            foreach ($search_terms as $search_term) {
979                if (mb_stripos($gedcom, $search_term) === false) {
980                    return false;
981                }
982            }
983
984            return true;
985        };
986    }
987
988    /**
989     * Searching for short or common text can give more results than the system can process.
990     *
991     * @param int $limit
992     *
993     * @return Closure
994     */
995    private function rowLimiter(int $limit = 1000): Closure
996    {
997        return static function () use ($limit): void {
998            static $n = 0;
999
1000            if (++$n > $limit) {
1001                $message = I18N::translate('The search returned too many results.');
1002
1003                throw new HttpServiceUnavailableException($message);
1004            }
1005        };
1006    }
1007
1008    /**
1009     * Convert a row from any tree in the families table into a family object.
1010     *
1011     * @return Closure
1012     */
1013    private function familyRowMapper(): Closure
1014    {
1015        return function (stdClass $row): Family {
1016            $tree = $this->tree_service->find((int) $row->f_file);
1017
1018            return Family::getInstance($row->f_id, $tree, $row->f_gedcom);
1019        };
1020    }
1021
1022    /**
1023     * Convert a row from any tree in the individuals table into an individual object.
1024     *
1025     * @return Closure
1026     */
1027    private function individualRowMapper(): Closure
1028    {
1029        return function (stdClass $row): Individual {
1030            $tree = $this->tree_service->find((int) $row->i_file);
1031
1032            return Individual::getInstance($row->i_id, $tree, $row->i_gedcom);
1033        };
1034    }
1035
1036    /**
1037     * Convert a row from any tree in the media table into an media object.
1038     *
1039     * @return Closure
1040     */
1041    private function mediaRowMapper(): Closure
1042    {
1043        return function (stdClass $row): Media {
1044            $tree = $this->tree_service->find((int) $row->m_file);
1045
1046            return Media::getInstance($row->m_id, $tree, $row->m_gedcom);
1047        };
1048    }
1049
1050    /**
1051     * Convert a row from any tree in the other table into a note object.
1052     *
1053     * @return Closure
1054     */
1055    private function noteRowMapper(): Closure
1056    {
1057        return function (stdClass $row): Note {
1058            $tree = $this->tree_service->find((int) $row->o_file);
1059
1060            return Note::getInstance($row->o_id, $tree, $row->o_gedcom);
1061        };
1062    }
1063
1064    /**
1065     * Convert a row from any tree in the other table into a repository object.
1066     *
1067     * @return Closure
1068     */
1069    private function repositoryRowMapper(): Closure
1070    {
1071        return function (stdClass $row): Repository {
1072            $tree = $this->tree_service->find((int) $row->o_file);
1073
1074            return Repository::getInstance($row->o_id, $tree, $row->o_gedcom);
1075        };
1076    }
1077
1078    /**
1079     * Convert a row from any tree in the sources table into a source object.
1080     *
1081     * @return Closure
1082     */
1083    private function sourceRowMapper(): Closure
1084    {
1085        return function (stdClass $row): Source {
1086            $tree = $this->tree_service->find((int) $row->s_file);
1087
1088            return Source::getInstance($row->s_id, $tree, $row->s_gedcom);
1089        };
1090    }
1091
1092    /**
1093     * Convert a row from any tree in the other table into a submitter object.
1094     *
1095     * @return Closure
1096     */
1097    private function submitterRowMapper(): Closure
1098    {
1099        return function (stdClass $row): GedcomRecord {
1100            $tree = $this->tree_service->find((int) $row->o_file);
1101
1102            return GedcomRecord::getInstance($row->o_id, $tree, $row->o_gedcom);
1103        };
1104    }
1105}
1106