xref: /webtrees/app/Module/SiteMapModule.php (revision 0422c1fe06810b05ea48309b1f3ae558fb2153d0)
18c2e8227SGreg Roach<?php
28c2e8227SGreg Roach/**
38c2e8227SGreg Roach * webtrees: online genealogy
48fcd0d32SGreg Roach * Copyright (C) 2019 webtrees development team
58c2e8227SGreg Roach * This program is free software: you can redistribute it and/or modify
68c2e8227SGreg Roach * it under the terms of the GNU General Public License as published by
78c2e8227SGreg Roach * the Free Software Foundation, either version 3 of the License, or
88c2e8227SGreg Roach * (at your option) any later version.
98c2e8227SGreg Roach * This program is distributed in the hope that it will be useful,
108c2e8227SGreg Roach * but WITHOUT ANY WARRANTY; without even the implied warranty of
118c2e8227SGreg Roach * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
128c2e8227SGreg Roach * GNU General Public License for more details.
138c2e8227SGreg Roach * You should have received a copy of the GNU General Public License
148c2e8227SGreg Roach * along with this program. If not, see <http://www.gnu.org/licenses/>.
158c2e8227SGreg Roach */
16e7f56f2aSGreg Roachdeclare(strict_types=1);
17e7f56f2aSGreg Roach
1876692c8bSGreg Roachnamespace Fisharebest\Webtrees\Module;
1976692c8bSGreg Roach
20*0422c1feSGreg Roachuse Carbon\Carbon;
21a5f7ed67SGreg Roachuse Fisharebest\Webtrees\FlashMessages;
22a5f7ed67SGreg Roachuse Fisharebest\Webtrees\GedcomRecord;
23b1b85189SGreg Roachuse Fisharebest\Webtrees\Html;
240e62c4b8SGreg Roachuse Fisharebest\Webtrees\I18N;
250e62c4b8SGreg Roachuse Fisharebest\Webtrees\Individual;
260e62c4b8SGreg Roachuse Fisharebest\Webtrees\Media;
270e62c4b8SGreg Roachuse Fisharebest\Webtrees\Note;
280e62c4b8SGreg Roachuse Fisharebest\Webtrees\Repository;
290e62c4b8SGreg Roachuse Fisharebest\Webtrees\Source;
300e62c4b8SGreg Roachuse Fisharebest\Webtrees\Tree;
31fa17fb66SGreg Roachuse Illuminate\Database\Capsule\Manager as DB;
32886b77daSGreg Roachuse Illuminate\Support\Collection;
33a5f7ed67SGreg Roachuse Symfony\Component\HttpFoundation\RedirectResponse;
34a5f7ed67SGreg Roachuse Symfony\Component\HttpFoundation\Request;
35a5f7ed67SGreg Roachuse Symfony\Component\HttpFoundation\Response;
36a5f7ed67SGreg Roachuse Symfony\Component\HttpKernel\Exception\NotFoundHttpException;
378c2e8227SGreg Roach
/**
 * Class SiteMapModule
 *
 * Serves a sitemap index and paged sitemap "volume" files (XML), and provides
 * an administration page where each tree can be included in, or excluded from,
 * the sitemap. Generated XML is cached in the module preferences.
 */
class SiteMapModule extends AbstractModule implements ModuleConfigInterface
{
    private const RECORDS_PER_VOLUME = 500; // Keep sitemap files small, for memory, CPU and max_allowed_packet limits.
    private const CACHE_LIFE         = 1209600; // Two weeks

    /**
     * How should this module be labelled on tabs, menus, etc.?
     *
     * @return string
     */
    public function getTitle(): string
    {
        /* I18N: Name of a module - see http://en.wikipedia.org/wiki/Sitemaps */
        return I18N::translate('Sitemaps');
    }

    /**
     * A sentence describing what this module does.
     *
     * @return string
     */
    public function getDescription(): string
    {
        /* I18N: Description of the “Sitemaps” module */
        return I18N::translate('Generate sitemap files for search engines.');
    }

    /**
     * The URL to a page where the user can modify the configuration of this module.
     *
     * @return string
     */
    public function getConfigLink(): string
    {
        return route('module', [
            'module' => $this->getName(),
            'action' => 'Admin',
        ]);
    }

    /**
     * Show the configuration page: the list of trees, the URL of the sitemap
     * index, and links for submitting that URL to search engines.
     *
     * @return Response
     */
    public function getAdminAction(): Response
    {
        $this->layout = 'layouts/administration';

        $sitemap_url = route('module', [
            'module' => 'sitemap',
            'action' => 'Index',
        ]);

        // This list comes from http://en.wikipedia.org/wiki/Sitemaps
        $submit_urls = [
            'Bing/Yahoo' => Html::url('https://www.bing.com/webmaster/ping.aspx', ['siteMap' => $sitemap_url]),
            'Google'     => Html::url('https://www.google.com/webmasters/tools/ping', ['sitemap' => $sitemap_url]),
        ];

        return $this->viewResponse('modules/sitemap/config', [
            'all_trees'   => Tree::getAll(),
            'sitemap_url' => $sitemap_url,
            'submit_urls' => $submit_urls,
            'title'       => $this->getTitle(),
        ]);
    }

    /**
     * Save the "include in sitemap" setting of every tree, then return to the
     * configuration page.
     *
     * @param Request $request
     *
     * @return RedirectResponse
     */
    public function postAdminAction(Request $request): RedirectResponse
    {
        foreach (Tree::getAll() as $tree) {
            // A missing or empty request parameter means "do not include".
            $include_in_sitemap = (bool) $request->get('sitemap' . $tree->id());
            $tree->setPreference('include_in_sitemap', (string) $include_in_sitemap);
        }

        // Expire the cached index, so that it is rebuilt on the next request.
        // NOTE(review): presumably the index view uses "include_in_sitemap" - confirm against the view.
        $this->setPreference('sitemap.timestamp', '0');

        FlashMessages::addMessage(I18N::translate('The preferences for the module “%s” have been updated.', $this->getTitle()), 'success');

        return new RedirectResponse($this->getConfigLink());
    }

    /**
     * Serve the sitemap index.
     *
     * The generated XML is cached in the module preferences ("sitemap.xml" and
     * "sitemap.timestamp") and is re-used until it is older than CACHE_LIFE.
     *
     * @return Response
     */
    public function getIndexAction(): Response
    {
        $now       = Carbon::now()->timestamp;
        $timestamp = (int) $this->getPreference('sitemap.timestamp');

        if ($timestamp > $now - self::CACHE_LIFE) {
            $content = $this->getPreference('sitemap.xml');
        } else {
            // Number of records of each type, keyed by tree ID.
            $count_individuals = DB::table('individuals')
                ->groupBy('i_file')
                ->select([DB::raw('COUNT(*) AS total'), 'i_file'])
                ->pluck('total', 'i_file');

            $count_media = DB::table('media')
                ->groupBy('m_file')
                ->select([DB::raw('COUNT(*) AS total'), 'm_file'])
                ->pluck('total', 'm_file');

            $count_notes = DB::table('other')
                ->where('o_type', '=', 'NOTE')
                ->groupBy('o_file')
                ->select([DB::raw('COUNT(*) AS total'), 'o_file'])
                ->pluck('total', 'o_file');

            $count_repositories = DB::table('other')
                ->where('o_type', '=', 'REPO')
                ->groupBy('o_file')
                ->select([DB::raw('COUNT(*) AS total'), 'o_file'])
                ->pluck('total', 'o_file');

            $count_sources = DB::table('sources')
                ->groupBy('s_file')
                ->select([DB::raw('COUNT(*) AS total'), 's_file'])
                ->pluck('total', 's_file');

            $content = view('modules/sitemap/sitemap-index.xml', [
                'all_trees'          => Tree::getAll(),
                'count_individuals'  => $count_individuals,
                'count_media'        => $count_media,
                'count_notes'        => $count_notes,
                'count_repositories' => $count_repositories,
                'count_sources'      => $count_sources,
                'last_mod'           => date('Y-m-d'),
                'records_per_volume' => self::RECORDS_PER_VOLUME,
            ]);

            // Store the content before the timestamp: if the second write fails,
            // the cache stays expired instead of pairing a fresh timestamp with old content.
            $this->setPreference('sitemap.xml', $content);
            $this->setPreference('sitemap.timestamp', (string) $now);
        }

        return new Response($content, Response::HTTP_OK, [
            'Content-Type' => 'application/xml',
        ]);
    }

    /**
     * Serve one sitemap volume.
     *
     * The "file" request parameter has the form "<tree id>-<record type>-<volume>",
     * where the record type is one of i, m, n, r or s. Each volume lists up to
     * RECORDS_PER_VOLUME records, and is cached in the module preferences under
     * its own key until it is older than CACHE_LIFE.
     *
     * @param Request $request
     *
     * @return Response
     *
     * @throws NotFoundHttpException If the file name is malformed or the tree does not exist.
     */
    public function getFileAction(Request $request): Response
    {
        $file = $request->get('file', '');

        // The parameter is untrusted, and may even be an array (e.g. "?file[]=x").
        if (!is_string($file) || !preg_match('/^(\d+)-([imnrs])-(\d+)$/', $file, $match)) {
            throw new NotFoundHttpException('Bad sitemap file');
        }

        $tree_id = (int) $match[1];
        $type    = $match[2];
        $volume  = (int) $match[3];

        // The record offset must fit in an integer. Otherwise the multiplication below
        // would produce a float, which strict typing rejects with a TypeError.
        if ($volume > intdiv(PHP_INT_MAX, self::RECORDS_PER_VOLUME)) {
            throw new NotFoundHttpException('Bad sitemap file');
        }

        // Build the cache key from the parsed numbers, so that equivalent file names
        // (e.g. "1-i-2" and "01-i-002") share a single cache entry.
        $cache_key = 'sitemap-' . $tree_id . '-' . $type . '-' . $volume;

        $now       = Carbon::now()->timestamp;
        $timestamp = (int) $this->getPreference($cache_key . '.timestamp');

        if ($timestamp > $now - self::CACHE_LIFE) {
            $content = $this->getPreference($cache_key . '.xml');
        } else {
            $tree = Tree::findById($tree_id);

            if ($tree === null) {
                throw new NotFoundHttpException('No such tree');
            }

            $records = $this->sitemapRecords($tree, $type, self::RECORDS_PER_VOLUME, self::RECORDS_PER_VOLUME * $volume);

            $content = view('modules/sitemap/sitemap-file.xml', ['records' => $records]);

            // Do not cache empty volumes. Otherwise requests for non-existent volume
            // numbers could create an unlimited number of stored preferences.
            if (!$records->isEmpty()) {
                // NOTE(review): the records are filtered by GedcomRecord::accessFilter(), which
                // presumably depends on who is making the request - confirm that output generated
                // for a signed-in user is safe to serve from the cache to everyone.
                $this->setPreference($cache_key . '.xml', $content);
                $this->setPreference($cache_key . '.timestamp', (string) $now);
            }
        }

        return new Response($content, Response::HTTP_OK, [
            'Content-Type' => 'application/xml',
        ]);
    }

    /**
     * Fetch one page of records of the given type, without the private ones.
     *
     * @param Tree   $tree
     * @param string $type   One of i, m, n, r or s (individual, media, note, repository, source)
     * @param int    $limit  Maximum number of rows to read
     * @param int    $offset Number of rows to skip
     *
     * @return Collection|GedcomRecord[]
     *
     * @throws NotFoundHttpException If the record type is not recognised.
     */
    private function sitemapRecords(Tree $tree, string $type, int $limit, int $offset): Collection
    {
        switch ($type) {
            case 'i':
                $records = $this->sitemapIndividuals($tree, $limit, $offset);
                break;

            case 'm':
                $records = $this->sitemapMedia($tree, $limit, $offset);
                break;

            case 'n':
                $records = $this->sitemapNotes($tree, $limit, $offset);
                break;

            case 'r':
                $records = $this->sitemapRepositories($tree, $limit, $offset);
                break;

            case 's':
                $records = $this->sitemapSources($tree, $limit, $offset);
                break;

            default:
                throw new NotFoundHttpException('Invalid record type: ' . $type);
        }

        // Skip private records. The filter runs after the rows are paged,
        // so a volume can hold fewer than $limit records.
        return $records->filter(GedcomRecord::accessFilter());
    }

    /**
     * One page of the individuals in a tree, ordered by XREF.
     *
     * @param Tree $tree
     * @param int  $limit
     * @param int  $offset
     *
     * @return Collection|Individual[]
     */
    private function sitemapIndividuals(Tree $tree, int $limit, int $offset): Collection
    {
        return DB::table('individuals')
            ->where('i_file', '=', $tree->id())
            ->orderBy('i_id')
            ->skip($offset)
            ->take($limit)
            ->get()
            ->map(Individual::rowMapper());
    }

    /**
     * One page of the media objects in a tree, ordered by XREF.
     *
     * @param Tree $tree
     * @param int  $limit
     * @param int  $offset
     *
     * @return Collection|Media[]
     */
    private function sitemapMedia(Tree $tree, int $limit, int $offset): Collection
    {
        return DB::table('media')
            ->where('m_file', '=', $tree->id())
            ->orderBy('m_id')
            ->skip($offset)
            ->take($limit)
            ->get()
            ->map(Media::rowMapper());
    }

    /**
     * One page of the shared notes in a tree, ordered by XREF.
     *
     * @param Tree $tree
     * @param int  $limit
     * @param int  $offset
     *
     * @return Collection|Note[]
     */
    private function sitemapNotes(Tree $tree, int $limit, int $offset): Collection
    {
        return DB::table('other')
            ->where('o_file', '=', $tree->id())
            ->where('o_type', '=', 'NOTE')
            ->orderBy('o_id')
            ->skip($offset)
            ->take($limit)
            ->get()
            ->map(Note::rowMapper());
    }

    /**
     * One page of the repositories in a tree, ordered by XREF.
     *
     * @param Tree $tree
     * @param int  $limit
     * @param int  $offset
     *
     * @return Collection|Repository[]
     */
    private function sitemapRepositories(Tree $tree, int $limit, int $offset): Collection
    {
        return DB::table('other')
            ->where('o_file', '=', $tree->id())
            ->where('o_type', '=', 'REPO')
            ->orderBy('o_id')
            ->skip($offset)
            ->take($limit)
            ->get()
            ->map(Repository::rowMapper());
    }

    /**
     * One page of the sources in a tree, ordered by XREF.
     *
     * @param Tree $tree
     * @param int  $limit
     * @param int  $offset
     *
     * @return Collection|Source[]
     */
    private function sitemapSources(Tree $tree, int $limit, int $offset): Collection
    {
        return DB::table('sources')
            ->where('s_file', '=', $tree->id())
            ->orderBy('s_id')
            ->skip($offset)
            ->take($limit)
            ->get()
            ->map(Source::rowMapper());
    }
}
349