16fd01894SGreg Roach<?php 26fd01894SGreg Roach 36fd01894SGreg Roach/** 46fd01894SGreg Roach * webtrees: online genealogy 5*d11be702SGreg Roach * Copyright (C) 2023 webtrees development team 66fd01894SGreg Roach * This program is free software: you can redistribute it and/or modify 76fd01894SGreg Roach * it under the terms of the GNU General Public License as published by 86fd01894SGreg Roach * the Free Software Foundation, either version 3 of the License, or 96fd01894SGreg Roach * (at your option) any later version. 106fd01894SGreg Roach * This program is distributed in the hope that it will be useful, 116fd01894SGreg Roach * but WITHOUT ANY WARRANTY; without even the implied warranty of 126fd01894SGreg Roach * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 136fd01894SGreg Roach * GNU General Public License for more details. 146fd01894SGreg Roach * You should have received a copy of the GNU General Public License 1589f7189bSGreg Roach * along with this program. If not, see <https://www.gnu.org/licenses/>. 166fd01894SGreg Roach */ 176fd01894SGreg Roach 186fd01894SGreg Roachdeclare(strict_types=1); 196fd01894SGreg Roach 206fd01894SGreg Roachnamespace Fisharebest\Webtrees\Services; 216fd01894SGreg Roach 221c6adce8SGreg Roachuse Fisharebest\Webtrees\Encodings\UTF8; 236fd01894SGreg Roachuse Fisharebest\Webtrees\Family; 246fd01894SGreg Roachuse Fisharebest\Webtrees\GedcomRecord; 256fd01894SGreg Roachuse Fisharebest\Webtrees\Header; 266fd01894SGreg Roachuse Fisharebest\Webtrees\I18N; 276fd01894SGreg Roachuse Fisharebest\Webtrees\Individual; 286fd01894SGreg Roachuse Fisharebest\Webtrees\Media; 29f0c88a96SGreg Roachuse Fisharebest\Webtrees\Registry; 306fd01894SGreg Roachuse Fisharebest\Webtrees\Site; 316fd01894SGreg Roachuse Fisharebest\Webtrees\Source; 326fd01894SGreg Roachuse Fisharebest\Webtrees\Tree; 336fd01894SGreg Roachuse Illuminate\Database\Capsule\Manager as DB; 346fd01894SGreg Roachuse Illuminate\Database\Query\Expression; 356fd01894SGreg Roachuse Illuminate\Database\Query\JoinClause; 366fd01894SGreg Roachuse Illuminate\Support\Collection; 37f7cf8a15SGreg Roachuse League\Flysystem\FilesystemException; 38f7cf8a15SGreg Roachuse League\Flysystem\FilesystemOperator; 39f7cf8a15SGreg Roachuse League\Flysystem\StorageAttributes; 406fd01894SGreg Roach 416fd01894SGreg Roachuse function array_map; 426fd01894SGreg Roachuse function explode; 436fd01894SGreg Roachuse function fclose; 446fd01894SGreg Roachuse function fread; 456fd01894SGreg Roachuse function preg_match; 466fd01894SGreg Roach 476fd01894SGreg Roach/** 486fd01894SGreg Roach * Utilities for the control panel. 496fd01894SGreg Roach */ 506fd01894SGreg Roachclass AdminService 516fd01894SGreg Roach{ 526fd01894SGreg Roach /** 536fd01894SGreg Roach * Count of XREFs used by two trees at the same time. 546fd01894SGreg Roach * 556fd01894SGreg Roach * @param Tree $tree1 566fd01894SGreg Roach * @param Tree $tree2 576fd01894SGreg Roach * 586fd01894SGreg Roach * @return int 596fd01894SGreg Roach */ 606fd01894SGreg Roach public function countCommonXrefs(Tree $tree1, Tree $tree2): int 616fd01894SGreg Roach { 626fd01894SGreg Roach $subquery1 = DB::table('individuals') 636fd01894SGreg Roach ->where('i_file', '=', $tree1->id()) 646fd01894SGreg Roach ->select(['i_id AS xref']) 656fd01894SGreg Roach ->union(DB::table('families') 666fd01894SGreg Roach ->where('f_file', '=', $tree1->id()) 676fd01894SGreg Roach ->select(['f_id AS xref'])) 686fd01894SGreg Roach ->union(DB::table('sources') 696fd01894SGreg Roach ->where('s_file', '=', $tree1->id()) 706fd01894SGreg Roach ->select(['s_id AS xref'])) 716fd01894SGreg Roach ->union(DB::table('media') 726fd01894SGreg Roach ->where('m_file', '=', $tree1->id()) 736fd01894SGreg Roach ->select(['m_id AS xref'])) 746fd01894SGreg Roach ->union(DB::table('other') 756fd01894SGreg Roach ->where('o_file', '=', $tree1->id()) 766fd01894SGreg Roach ->whereNotIn('o_type', [Header::RECORD_TYPE, 'TRLR']) 776fd01894SGreg Roach ->select(['o_id AS xref'])); 786fd01894SGreg Roach 796fd01894SGreg Roach $subquery2 = DB::table('change') 806fd01894SGreg Roach ->where('gedcom_id', '=', $tree2->id()) 816fd01894SGreg Roach ->select(['xref AS other_xref']) 826fd01894SGreg Roach ->union(DB::table('individuals') 836fd01894SGreg Roach ->where('i_file', '=', $tree2->id()) 846fd01894SGreg Roach ->select(['i_id AS xref'])) 856fd01894SGreg Roach ->union(DB::table('families') 866fd01894SGreg Roach ->where('f_file', '=', $tree2->id()) 876fd01894SGreg Roach ->select(['f_id AS xref'])) 886fd01894SGreg Roach ->union(DB::table('sources') 896fd01894SGreg Roach ->where('s_file', '=', $tree2->id()) 906fd01894SGreg Roach ->select(['s_id AS xref'])) 916fd01894SGreg Roach ->union(DB::table('media') 926fd01894SGreg Roach ->where('m_file', '=', $tree2->id()) 936fd01894SGreg Roach ->select(['m_id AS xref'])) 946fd01894SGreg Roach ->union(DB::table('other') 956fd01894SGreg Roach ->where('o_file', '=', $tree2->id()) 966fd01894SGreg Roach ->whereNotIn('o_type', [Header::RECORD_TYPE, 'TRLR']) 976fd01894SGreg Roach ->select(['o_id AS xref'])); 986fd01894SGreg Roach 996fd01894SGreg Roach return DB::table(new Expression('(' . $subquery1->toSql() . ') AS sub1')) 1006fd01894SGreg Roach ->mergeBindings($subquery1) 1016fd01894SGreg Roach ->joinSub($subquery2, 'sub2', 'other_xref', '=', 'xref') 1026fd01894SGreg Roach ->count(); 1036fd01894SGreg Roach } 1046fd01894SGreg Roach 1056fd01894SGreg Roach /** 1066fd01894SGreg Roach * @param Tree $tree 1076fd01894SGreg Roach * 1087c2c99faSGreg Roach * @return array<string,array<int,array<int,GedcomRecord>>> 1096fd01894SGreg Roach */ 1106fd01894SGreg Roach public function duplicateRecords(Tree $tree): array 1116fd01894SGreg Roach { 1126fd01894SGreg Roach // We can't do any reasonable checks using MySQL. 1136fd01894SGreg Roach // Will need to wait for a "repositories" table. 1146fd01894SGreg Roach $repositories = []; 1156fd01894SGreg Roach 1166fd01894SGreg Roach $sources = DB::table('sources') 1176fd01894SGreg Roach ->where('s_file', '=', $tree->id()) 1186fd01894SGreg Roach ->groupBy(['s_name']) 1196fd01894SGreg Roach ->having(new Expression('COUNT(s_id)'), '>', '1') 1206fd01894SGreg Roach ->select([new Expression('GROUP_CONCAT(s_id) AS xrefs')]) 12192ae7c02SGreg Roach ->orderBy('xrefs') 1226fd01894SGreg Roach ->pluck('xrefs') 1236fd01894SGreg Roach ->map(static function (string $xrefs) use ($tree): array { 1246fd01894SGreg Roach return array_map(static function (string $xref) use ($tree): Source { 1256b9cb339SGreg Roach return Registry::sourceFactory()->make($xref, $tree); 1266fd01894SGreg Roach }, explode(',', $xrefs)); 1276fd01894SGreg Roach }) 1286fd01894SGreg Roach ->all(); 1296fd01894SGreg Roach 1306fd01894SGreg Roach $individuals = DB::table('dates') 1316fd01894SGreg Roach ->join('name', static function (JoinClause $join): void { 1326fd01894SGreg Roach $join 1336fd01894SGreg Roach ->on('d_file', '=', 'n_file') 1346fd01894SGreg Roach ->on('d_gid', '=', 'n_id'); 1356fd01894SGreg Roach }) 1366fd01894SGreg Roach ->where('d_file', '=', $tree->id()) 1376fd01894SGreg Roach ->whereIn('d_fact', ['BIRT', 'CHR', 'BAPM', 'DEAT', 'BURI']) 1386fd01894SGreg Roach ->groupBy(['d_year', 'd_month', 'd_day', 'd_type', 'd_fact', 'n_type', 'n_full']) 1396fd01894SGreg Roach ->having(new Expression('COUNT(DISTINCT d_gid)'), '>', '1') 1406fd01894SGreg Roach ->select([new Expression('GROUP_CONCAT(DISTINCT d_gid ORDER BY d_gid) AS xrefs')]) 1416fd01894SGreg Roach ->distinct() 14292ae7c02SGreg Roach ->orderBy('xrefs') 1436fd01894SGreg Roach ->pluck('xrefs') 1446fd01894SGreg Roach ->map(static function (string $xrefs) use ($tree): array { 1456fd01894SGreg Roach return array_map(static function (string $xref) use ($tree): Individual { 1466b9cb339SGreg Roach return Registry::individualFactory()->make($xref, $tree); 1476fd01894SGreg Roach }, explode(',', $xrefs)); 1486fd01894SGreg Roach }) 1496fd01894SGreg Roach ->all(); 1506fd01894SGreg Roach 1516fd01894SGreg Roach $families = DB::table('families') 1526fd01894SGreg Roach ->where('f_file', '=', $tree->id()) 1536fd01894SGreg Roach ->groupBy([new Expression('LEAST(f_husb, f_wife)')]) 1546fd01894SGreg Roach ->groupBy([new Expression('GREATEST(f_husb, f_wife)')]) 1556fd01894SGreg Roach ->having(new Expression('COUNT(f_id)'), '>', '1') 1566fd01894SGreg Roach ->select([new Expression('GROUP_CONCAT(f_id) AS xrefs')]) 15792ae7c02SGreg Roach ->orderBy('xrefs') 1586fd01894SGreg Roach ->pluck('xrefs') 1596fd01894SGreg Roach ->map(static function (string $xrefs) use ($tree): array { 1606fd01894SGreg Roach return array_map(static function (string $xref) use ($tree): Family { 1616b9cb339SGreg Roach return Registry::familyFactory()->make($xref, $tree); 1626fd01894SGreg Roach }, explode(',', $xrefs)); 1636fd01894SGreg Roach }) 1646fd01894SGreg Roach ->all(); 1656fd01894SGreg Roach 1666fd01894SGreg Roach $media = DB::table('media_file') 1676fd01894SGreg Roach ->where('m_file', '=', $tree->id()) 1686fd01894SGreg Roach ->where('descriptive_title', '<>', '') 1696fd01894SGreg Roach ->groupBy(['descriptive_title']) 170f48369e0SGreg Roach ->having(new Expression('COUNT(DISTINCT m_id)'), '>', '1') 1716fd01894SGreg Roach ->select([new Expression('GROUP_CONCAT(m_id) AS xrefs')]) 17292ae7c02SGreg Roach ->orderBy('xrefs') 1736fd01894SGreg Roach ->pluck('xrefs') 1746fd01894SGreg Roach ->map(static function (string $xrefs) use ($tree): array { 1756fd01894SGreg Roach return array_map(static function (string $xref) use ($tree): Media { 1766b9cb339SGreg Roach return Registry::mediaFactory()->make($xref, $tree); 1776fd01894SGreg Roach }, explode(',', $xrefs)); 1786fd01894SGreg Roach }) 1796fd01894SGreg Roach ->all(); 1806fd01894SGreg Roach 1816fd01894SGreg Roach return [ 1826fd01894SGreg Roach I18N::translate('Repositories') => $repositories, 1836fd01894SGreg Roach I18N::translate('Sources') => $sources, 1846fd01894SGreg Roach I18N::translate('Individuals') => $individuals, 1856fd01894SGreg Roach I18N::translate('Families') => $families, 1866fd01894SGreg Roach I18N::translate('Media objects') => $media, 1876fd01894SGreg Roach ]; 1886fd01894SGreg Roach } 1896fd01894SGreg Roach 1906fd01894SGreg Roach /** 1916fd01894SGreg Roach * Every XREF used by this tree and also used by some other tree 1926fd01894SGreg Roach * 1936fd01894SGreg Roach * @param Tree $tree 1946fd01894SGreg Roach * 19524f2a3afSGreg Roach * @return array<string> 1966fd01894SGreg Roach */ 1976fd01894SGreg Roach public function duplicateXrefs(Tree $tree): array 1986fd01894SGreg Roach { 1996fd01894SGreg Roach $subquery1 = DB::table('individuals') 2006fd01894SGreg Roach ->where('i_file', '=', $tree->id()) 2016fd01894SGreg Roach ->select(['i_id AS xref', new Expression("'INDI' AS type")]) 2026fd01894SGreg Roach ->union(DB::table('families') 2036fd01894SGreg Roach ->where('f_file', '=', $tree->id()) 2046fd01894SGreg Roach ->select(['f_id AS xref', new Expression("'FAM' AS type")])) 2056fd01894SGreg Roach ->union(DB::table('sources') 2066fd01894SGreg Roach ->where('s_file', '=', $tree->id()) 2076fd01894SGreg Roach ->select(['s_id AS xref', new Expression("'SOUR' AS type")])) 2086fd01894SGreg Roach ->union(DB::table('media') 2096fd01894SGreg Roach ->where('m_file', '=', $tree->id()) 2106fd01894SGreg Roach ->select(['m_id AS xref', new Expression("'OBJE' AS type")])) 2116fd01894SGreg Roach ->union(DB::table('other') 2126fd01894SGreg Roach ->where('o_file', '=', $tree->id()) 2136fd01894SGreg Roach ->whereNotIn('o_type', [Header::RECORD_TYPE, 'TRLR']) 2146fd01894SGreg Roach ->select(['o_id AS xref', 'o_type AS type'])); 2156fd01894SGreg Roach 2166fd01894SGreg Roach $subquery2 = DB::table('change') 2176fd01894SGreg Roach ->where('gedcom_id', '<>', $tree->id()) 2186fd01894SGreg Roach ->select(['xref AS other_xref']) 2196fd01894SGreg Roach ->union(DB::table('individuals') 2206fd01894SGreg Roach ->where('i_file', '<>', $tree->id()) 2216fd01894SGreg Roach ->select(['i_id AS xref'])) 2226fd01894SGreg Roach ->union(DB::table('families') 2236fd01894SGreg Roach ->where('f_file', '<>', $tree->id()) 2246fd01894SGreg Roach ->select(['f_id AS xref'])) 2256fd01894SGreg Roach ->union(DB::table('sources') 2266fd01894SGreg Roach ->where('s_file', '<>', $tree->id()) 2276fd01894SGreg Roach ->select(['s_id AS xref'])) 2286fd01894SGreg Roach ->union(DB::table('media') 2296fd01894SGreg Roach ->where('m_file', '<>', $tree->id()) 2306fd01894SGreg Roach ->select(['m_id AS xref'])) 2316fd01894SGreg Roach ->union(DB::table('other') 2326fd01894SGreg Roach ->where('o_file', '<>', $tree->id()) 2336fd01894SGreg Roach ->whereNotIn('o_type', [Header::RECORD_TYPE, 'TRLR']) 2346fd01894SGreg Roach ->select(['o_id AS xref'])); 2356fd01894SGreg Roach 2369b80d2d9SGreg Roach return DB::query() 2379b80d2d9SGreg Roach ->fromSub($subquery1, 'sub1') 2386fd01894SGreg Roach ->joinSub($subquery2, 'sub2', 'other_xref', '=', 'xref') 2396fd01894SGreg Roach ->pluck('type', 'xref') 2406fd01894SGreg Roach ->all(); 2416fd01894SGreg Roach } 2426fd01894SGreg Roach 2436fd01894SGreg Roach /** 2446fd01894SGreg Roach * A list of GEDCOM files in the data folder. 2456fd01894SGreg Roach * 246f7cf8a15SGreg Roach * @param FilesystemOperator $filesystem 2476fd01894SGreg Roach * 24836779af1SGreg Roach * @return Collection<int,string> 2496fd01894SGreg Roach */ 250f7cf8a15SGreg Roach public function gedcomFiles(FilesystemOperator $filesystem): Collection 2516fd01894SGreg Roach { 252f0448b68SGreg Roach try { 253f7cf8a15SGreg Roach $files = $filesystem->listContents('') 254f7cf8a15SGreg Roach ->filter(static function (StorageAttributes $attributes) use ($filesystem) { 255f7cf8a15SGreg Roach if (!$attributes->isFile()) { 2566fd01894SGreg Roach return false; 2576fd01894SGreg Roach } 2586fd01894SGreg Roach 259f7cf8a15SGreg Roach $stream = $filesystem->readStream($attributes->path()); 2606fd01894SGreg Roach 2616fd01894SGreg Roach $header = fread($stream, 10); 2626fd01894SGreg Roach fclose($stream); 2636fd01894SGreg Roach 2641c6adce8SGreg Roach return preg_match('/^(' . UTF8::BYTE_ORDER_MARK . ')?0 HEAD/', $header) > 0; 2656fd01894SGreg Roach }) 266f7cf8a15SGreg Roach ->map(function (StorageAttributes $attributes) { 267f7cf8a15SGreg Roach return $attributes->path(); 2686fd01894SGreg Roach }) 269f7cf8a15SGreg Roach ->toArray(); 27028d026adSGreg Roach } catch (FilesystemException) { 271f0448b68SGreg Roach $files = []; 272f0448b68SGreg Roach } 273f7cf8a15SGreg Roach 274f7cf8a15SGreg Roach return Collection::make($files)->sort(); 2756fd01894SGreg Roach } 2766fd01894SGreg Roach 2776fd01894SGreg Roach /** 2786fd01894SGreg Roach * Change the behaviour a little, when there are a lot of trees. 2796fd01894SGreg Roach * 2806fd01894SGreg Roach * @return int 2816fd01894SGreg Roach */ 2826fd01894SGreg Roach public function multipleTreeThreshold(): int 2836fd01894SGreg Roach { 2848a07c98eSGreg Roach return (int) Site::getPreference('MULTIPLE_TREE_THRESHOLD'); 2856fd01894SGreg Roach } 2866fd01894SGreg Roach} 287