1<?php 2 3/** 4 * webtrees: online genealogy 5 * Copyright (C) 2021 webtrees development team 6 * This program is free software: you can redistribute it and/or modify 7 * it under the terms of the GNU General Public License as published by 8 * the Free Software Foundation, either version 3 of the License, or 9 * (at your option) any later version. 10 * This program is distributed in the hope that it will be useful, 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 13 * GNU General Public License for more details. 14 * You should have received a copy of the GNU General Public License 15 * along with this program. If not, see <https://www.gnu.org/licenses/>. 16 */ 17 18declare(strict_types=1); 19 20namespace Fisharebest\Webtrees\Services; 21 22use Fisharebest\Webtrees\FlashMessages; 23use Fisharebest\Webtrees\I18N; 24use Fisharebest\Webtrees\Registry; 25use Fisharebest\Webtrees\Tree; 26use Illuminate\Database\Capsule\Manager as DB; 27use Illuminate\Database\Query\Expression; 28use Illuminate\Database\Query\JoinClause; 29use Illuminate\Support\Collection; 30use InvalidArgumentException; 31use League\Flysystem\Filesystem; 32use League\Flysystem\FilesystemException; 33use League\Flysystem\FilesystemOperator; 34use League\Flysystem\StorageAttributes; 35use Psr\Http\Message\ServerRequestInterface; 36use Psr\Http\Message\UploadedFileInterface; 37use RuntimeException; 38 39use function array_combine; 40use function array_diff; 41use function assert; 42use function dirname; 43use function ini_get; 44use function intdiv; 45use function min; 46use function pathinfo; 47use function preg_replace; 48use function sha1; 49use function sort; 50use function str_contains; 51use function str_ends_with; 52use function str_starts_with; 53use function strtolower; 54use function strtr; 55use function substr; 56use function trim; 57 58use const PATHINFO_EXTENSION; 59use const UPLOAD_ERR_OK; 60 61/** 62 * Managing media files. 63 */ 64class MediaFileService 65{ 66 public const EDIT_RESTRICTIONS = [ 67 'locked', 68 ]; 69 70 public const PRIVACY_RESTRICTIONS = [ 71 'none', 72 'privacy', 73 'confidential', 74 ]; 75 76 public const EXTENSION_TO_FORM = [ 77 'jpeg' => 'jpg', 78 'tiff' => 'tif', 79 ]; 80 81 private const IGNORE_FOLDERS = [ 82 // Old versions of webtrees 83 'thumbs', 84 'watermarks', 85 // Windows 86 'Thumbs.db', 87 // Synology 88 '@eaDir', 89 // QNAP, 90 '.@__thumb', 91 ]; 92 93 /** 94 * What is the largest file a user may upload? 95 */ 96 public function maxUploadFilesize(): string 97 { 98 $sizePostMax = $this->parseIniFileSize(ini_get('post_max_size')); 99 $sizeUploadMax = $this->parseIniFileSize(ini_get('upload_max_filesize')); 100 101 $bytes = min($sizePostMax, $sizeUploadMax); 102 $kb = intdiv($bytes + 1023, 1024); 103 104 return I18N::translate('%s KB', I18N::number($kb)); 105 } 106 107 /** 108 * Returns the given size from an ini value in bytes. 109 * 110 * @param string $size 111 * 112 * @return int 113 */ 114 private function parseIniFileSize(string $size): int 115 { 116 $number = (int) $size; 117 118 switch (substr($size, -1)) { 119 case 'g': 120 case 'G': 121 return $number * 1073741824; 122 case 'm': 123 case 'M': 124 return $number * 1048576; 125 case 'k': 126 case 'K': 127 return $number * 1024; 128 default: 129 return $number; 130 } 131 } 132 133 /** 134 * A list of media files not already linked to a media object. 135 * 136 * @param Tree $tree 137 * @param FilesystemOperator $data_filesystem 138 * 139 * @return array<string> 140 */ 141 public function unusedFiles(Tree $tree, FilesystemOperator $data_filesystem): array 142 { 143 $used_files = DB::table('media_file') 144 ->where('m_file', '=', $tree->id()) 145 ->where('multimedia_file_refn', 'NOT LIKE', 'http://%') 146 ->where('multimedia_file_refn', 'NOT LIKE', 'https://%') 147 ->pluck('multimedia_file_refn') 148 ->all(); 149 150 $media_filesystem = $tree->mediaFilesystem($data_filesystem); 151 $disk_files = $this->allFilesOnDisk($media_filesystem, '', Filesystem::LIST_DEEP)->all(); 152 $unused_files = array_diff($disk_files, $used_files); 153 154 sort($unused_files); 155 156 return array_combine($unused_files, $unused_files); 157 } 158 159 /** 160 * Store an uploaded file (or URL), either to be added to a media object 161 * or to create a media object. 162 * 163 * @param ServerRequestInterface $request 164 * 165 * @return string The value to be stored in the 'FILE' field of the media object. 166 * @throws FilesystemException 167 */ 168 public function uploadFile(ServerRequestInterface $request): string 169 { 170 $tree = $request->getAttribute('tree'); 171 assert($tree instanceof Tree); 172 173 $data_filesystem = Registry::filesystem()->data(); 174 175 $params = (array) $request->getParsedBody(); 176 $file_location = $params['file_location']; 177 178 switch ($file_location) { 179 case 'url': 180 $remote = $params['remote']; 181 182 if (str_contains($remote, '://')) { 183 return $remote; 184 } 185 186 return ''; 187 188 case 'unused': 189 $unused = $params['unused']; 190 191 if ($tree->mediaFilesystem($data_filesystem)->fileExists($unused)) { 192 return $unused; 193 } 194 195 return ''; 196 197 case 'upload': 198 default: 199 $folder = $params['folder']; 200 $auto = $params['auto']; 201 $new_file = $params['new_file']; 202 203 /** @var UploadedFileInterface|null $uploaded_file */ 204 $uploaded_file = $request->getUploadedFiles()['file']; 205 if ($uploaded_file === null || $uploaded_file->getError() !== UPLOAD_ERR_OK) { 206 return ''; 207 } 208 209 // The filename 210 $new_file = strtr($new_file, ['\\' => '/']); 211 if ($new_file !== '' && !str_contains($new_file, '/')) { 212 $file = $new_file; 213 } else { 214 $file = $uploaded_file->getClientFilename(); 215 } 216 217 // The folder 218 $folder = strtr($folder, ['\\' => '/']); 219 $folder = trim($folder, '/'); 220 if ($folder !== '') { 221 $folder .= '/'; 222 } 223 224 // Generate a unique name for the file? 225 if ($auto === '1' || $tree->mediaFilesystem($data_filesystem)->fileExists($folder . $file)) { 226 $folder = ''; 227 $extension = pathinfo($uploaded_file->getClientFilename(), PATHINFO_EXTENSION); 228 $file = sha1((string) $uploaded_file->getStream()) . '.' . $extension; 229 } 230 231 try { 232 $tree->mediaFilesystem($data_filesystem)->writeStream($folder . $file, $uploaded_file->getStream()->detach()); 233 234 return $folder . $file; 235 } catch (RuntimeException | InvalidArgumentException $ex) { 236 FlashMessages::addMessage(I18N::translate('There was an error uploading your file.')); 237 238 return ''; 239 } 240 } 241 } 242 243 /** 244 * Convert the media file attributes into GEDCOM format. 245 * 246 * @param string $file 247 * @param string $type 248 * @param string $title 249 * @param string $note 250 * 251 * @return string 252 */ 253 public function createMediaFileGedcom(string $file, string $type, string $title, string $note): string 254 { 255 // Tidy non-printing characters 256 $type = trim(preg_replace('/\s+/', ' ', $type)); 257 $title = trim(preg_replace('/\s+/', ' ', $title)); 258 259 $gedcom = '1 FILE ' . $file; 260 261 $format = strtolower(pathinfo($file, PATHINFO_EXTENSION)); 262 $format = self::EXTENSION_TO_FORM[$format] ?? $format; 263 264 if ($format !== '') { 265 $gedcom .= "\n2 FORM " . $format; 266 } elseif ($type !== '') { 267 $gedcom .= "\n2 FORM"; 268 } 269 270 if ($type !== '') { 271 $gedcom .= "\n3 TYPE " . $type; 272 } 273 274 if ($title !== '') { 275 $gedcom .= "\n2 TITL " . $title; 276 } 277 278 if ($note !== '') { 279 // Convert HTML line endings to GEDCOM continuations 280 $gedcom .= "\n1 NOTE " . strtr($note, ["\r\n" => "\n2 CONT "]); 281 } 282 283 return $gedcom; 284 } 285 286 /** 287 * Fetch a list of all files on disk (in folders used by any tree). 288 * 289 * @param FilesystemOperator $filesystem $filesystem to search 290 * @param string $folder Root folder 291 * @param bool $subfolders Include subfolders 292 * 293 * @return Collection<string> 294 */ 295 public function allFilesOnDisk(FilesystemOperator $filesystem, string $folder, bool $subfolders): Collection 296 { 297 try { 298 $files = $filesystem->listContents($folder, $subfolders) 299 ->filter(function (StorageAttributes $attributes): bool { 300 return $attributes->isFile() && !$this->ignorePath($attributes->path()); 301 }) 302 ->map(static function (StorageAttributes $attributes): string { 303 return $attributes->path(); 304 }) 305 ->toArray(); 306 } catch (FilesystemException $ex) { 307 $files = []; 308 } 309 310 return new Collection($files); 311 } 312 313 /** 314 * Fetch a list of all files on in the database. 315 * 316 * @param string $media_folder Root folder 317 * @param bool $subfolders Include subfolders 318 * 319 * @return Collection<string> 320 */ 321 public function allFilesInDatabase(string $media_folder, bool $subfolders): Collection 322 { 323 $query = DB::table('media_file') 324 ->join('gedcom_setting', 'gedcom_id', '=', 'm_file') 325 ->where('setting_name', '=', 'MEDIA_DIRECTORY') 326 //->where('multimedia_file_refn', 'LIKE', '%/%') 327 ->where('multimedia_file_refn', 'NOT LIKE', 'http://%') 328 ->where('multimedia_file_refn', 'NOT LIKE', 'https://%') 329 ->where(new Expression('setting_value || multimedia_file_refn'), 'LIKE', $media_folder . '%') 330 ->select(new Expression('setting_value || multimedia_file_refn AS path')) 331 ->orderBy(new Expression('setting_value || multimedia_file_refn')); 332 333 if (!$subfolders) { 334 $query->where(new Expression('setting_value || multimedia_file_refn'), 'NOT LIKE', $media_folder . '%/%'); 335 } 336 337 return $query->pluck('path'); 338 } 339 340 /** 341 * Generate a list of all folders in either the database or the filesystem. 342 * 343 * @param FilesystemOperator $data_filesystem 344 * 345 * @return Collection<string,string> 346 * @throws FilesystemException 347 */ 348 public function allMediaFolders(FilesystemOperator $data_filesystem): Collection 349 { 350 $db_folders = DB::table('media_file') 351 ->leftJoin('gedcom_setting', static function (JoinClause $join): void { 352 $join 353 ->on('gedcom_id', '=', 'm_file') 354 ->where('setting_name', '=', 'MEDIA_DIRECTORY'); 355 }) 356 ->where('multimedia_file_refn', 'NOT LIKE', 'http://%') 357 ->where('multimedia_file_refn', 'NOT LIKE', 'https://%') 358 ->select(new Expression("COALESCE(setting_value, 'media/') || multimedia_file_refn AS path")) 359 ->pluck('path') 360 ->map(static function (string $path): string { 361 return dirname($path) . '/'; 362 }); 363 364 $media_roots = DB::table('gedcom') 365 ->leftJoin('gedcom_setting', static function (JoinClause $join): void { 366 $join 367 ->on('gedcom.gedcom_id', '=', 'gedcom_setting.gedcom_id') 368 ->where('setting_name', '=', 'MEDIA_DIRECTORY'); 369 }) 370 ->where('gedcom.gedcom_id', '>', '0') 371 ->pluck(new Expression("COALESCE(setting_value, 'media/')")) 372 ->uniqueStrict(); 373 374 $disk_folders = new Collection($media_roots); 375 376 foreach ($media_roots as $media_folder) { 377 $tmp = $data_filesystem->listContents($media_folder, Filesystem::LIST_DEEP) 378 ->filter(function (StorageAttributes $attributes): bool { 379 return $attributes->isDir() && !$this->ignorePath($attributes->path()); 380 }) 381 ->map(static function (StorageAttributes $attributes): string { 382 return $attributes->path() . '/'; 383 }) 384 ->toArray(); 385 386 $disk_folders = $disk_folders->concat($tmp); 387 } 388 389 return $disk_folders->concat($db_folders) 390 ->uniqueStrict() 391 ->mapWithKeys(static function (string $folder): array { 392 return [$folder => $folder]; 393 }); 394 } 395 396 /** 397 * Ignore certain media folders. 398 * 399 * @param string $path 400 * 401 * @return bool 402 */ 403 private function ignorePath(string $path): bool 404 { 405 foreach (explode('/', $path) as $part) { 406 if (in_array($part, self::IGNORE_FOLDERS, true)) { 407 return true; 408 } 409 } 410 411 return false; 412 } 413} 414