1<?php
2// This file is part of Moodle - http://moodle.org/
3//
4// Moodle is free software: you can redistribute it and/or modify
5// it under the terms of the GNU General Public License as published by
6// the Free Software Foundation, either version 3 of the License, or
7// (at your option) any later version.
8//
9// Moodle is distributed in the hope that it will be useful,
10// but WITHOUT ANY WARRANTY; without even the implied warranty of
11// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
12// GNU General Public License for more details.
13//
14// You should have received a copy of the GNU General Public License
15// along with Moodle.  If not, see <http://www.gnu.org/licenses/>.
16
17/**
18 * Implementation of .tar.gz packer.
19 *
20 * A limited subset of the .tar format is supported. This packer can open files
21 * that it wrote, but may not be able to open files from other sources,
22 * especially if they use extensions. There are restrictions on file
23 * length and character set of filenames.
24 *
25 * We generate POSIX-compliant ustar files. As a result, the following
26 * restrictions apply to archive paths:
27 *
28 * - Filename may not be more than 100 characters.
29 * - Total of path + filename may not be more than 256 characters.
30 * - For path more than 155 characters it may or may not work.
31 * - May not contain non-ASCII characters.
32 *
33 * @package core_files
34 * @copyright 2013 The Open University
35 * @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
36 */
37
38defined('MOODLE_INTERNAL') || die();
39
40require_once("$CFG->libdir/filestorage/file_packer.php");
41require_once("$CFG->libdir/filestorage/tgz_extractor.php");
42
43/**
44 * Utility class - handles all packing/unpacking of .tar.gz files.
45 *
46 * @package core_files
47 * @category files
48 * @copyright 2013 The Open University
49 * @license http://www.gnu.org/copyleft/gpl.html GNU GPL v3 or later
50 */
51class tgz_packer extends file_packer {
52    /**
53     * @var int Default timestamp used where unknown (Jan 1st 2013 00:00)
54     */
55    const DEFAULT_TIMESTAMP = 1356998400;
56
57    /**
58     * @var string Name of special archive index file added by Moodle.
59     */
60    const ARCHIVE_INDEX_FILE = '.ARCHIVE_INDEX';
61
62    /**
63     * @var string Required text at start of archive index file before file count.
64     */
65    const ARCHIVE_INDEX_COUNT_PREFIX = 'Moodle archive file index. Count: ';
66
67    /**
68     * @var bool If true, includes .ARCHIVE_INDEX file in root of tar file.
69     */
70    protected $includeindex = true;
71
72    /**
73     * @var int Max value for total progress.
74     */
75    const PROGRESS_MAX = 1000000;
76
77    /**
78     * @var int Tar files have a fixed block size of 512 bytes.
79     */
80    const TAR_BLOCK_SIZE = 512;
81
82    /**
83     * Archive files and store the result in file storage.
84     *
85     * Any existing file at that location will be overwritten.
86     *
87     * @param array $files array from archive path => pathname or stored_file
88     * @param int $contextid context ID
89     * @param string $component component
90     * @param string $filearea file area
91     * @param int $itemid item ID
92     * @param string $filepath file path
93     * @param string $filename file name
94     * @param int $userid user ID
95     * @param bool $ignoreinvalidfiles true means ignore missing or invalid files, false means abort on any error
96     * @param file_progress $progress Progress indicator callback or null if not required
97     * @return stored_file|bool false if error stored_file instance if ok
98     * @throws file_exception If file operations fail
99     * @throws coding_exception If any archive paths do not meet the restrictions
100     */
101    public function archive_to_storage(array $files, $contextid,
102            $component, $filearea, $itemid, $filepath, $filename,
103            $userid = null, $ignoreinvalidfiles = true, file_progress $progress = null) {
104        global $CFG;
105
106        // Set up a temporary location for the file.
107        $tempfolder = $CFG->tempdir . '/core_files';
108        check_dir_exists($tempfolder);
109        $tempfile = tempnam($tempfolder, '.tgz');
110
111        // Archive to the given path.
112        if ($result = $this->archive_to_pathname($files, $tempfile, $ignoreinvalidfiles, $progress)) {
113            // If there is an existing file, delete it.
114            $fs = get_file_storage();
115            if ($existing = $fs->get_file($contextid, $component, $filearea, $itemid, $filepath, $filename)) {
116                $existing->delete();
117            }
118            $filerecord = array('contextid' => $contextid, 'component' => $component,
119                    'filearea' => $filearea, 'itemid' => $itemid, 'filepath' => $filepath,
120                    'filename' => $filename, 'userid' => $userid, 'mimetype' => 'application/x-tgz');
121            self::delete_existing_file_record($fs, $filerecord);
122            $result = $fs->create_file_from_pathname($filerecord, $tempfile);
123        }
124
125        // Delete the temporary file (if created) and return.
126        @unlink($tempfile);
127        return $result;
128    }
129
130    /**
131     * Wrapper function useful for deleting an existing file (if present) just
132     * before creating a new one.
133     *
134     * @param file_storage $fs File storage
135     * @param array $filerecord File record in same format used to create file
136     */
137    public static function delete_existing_file_record(file_storage $fs, array $filerecord) {
138        if ($existing = $fs->get_file($filerecord['contextid'], $filerecord['component'],
139                $filerecord['filearea'], $filerecord['itemid'], $filerecord['filepath'],
140                $filerecord['filename'])) {
141            $existing->delete();
142        }
143    }
144
145    /**
146     * By default, the .tar file includes a .ARCHIVE_INDEX file as its first
147     * entry. This makes list_files much faster and allows for better progress
148     * reporting.
149     *
150     * If you need to disable the inclusion of this file, use this function
151     * before calling one of the archive_xx functions.
152     *
153     * @param bool $includeindex If true, includes index
154     */
155    public function set_include_index($includeindex) {
156        $this->includeindex = $includeindex;
157    }
158
159    /**
160     * Archive files and store the result in an OS file.
161     *
162     * @param array $files array from archive path => pathname or stored_file
163     * @param string $archivefile path to target zip file
164     * @param bool $ignoreinvalidfiles true means ignore missing or invalid files, false means abort on any error
165     * @param file_progress $progress Progress indicator callback or null if not required
166     * @return bool true if file created, false if not
167     * @throws coding_exception If any archive paths do not meet the restrictions
168     */
169    public function archive_to_pathname(array $files, $archivefile,
170            $ignoreinvalidfiles=true, file_progress $progress = null) {
171        // Open .gz file.
172        if (!($gz = gzopen($archivefile, 'wb'))) {
173            return false;
174        }
175        try {
176            // Because we update how we calculate progress after we already
177            // analyse the directory list, we can't just use a number of files
178            // as progress. Instead, progress always goes to PROGRESS_MAX
179            // and we do estimates as a proportion of that. To begin with,
180            // assume that counting files will be 10% of the work, so allocate
181            // one-tenth of PROGRESS_MAX to the total of all files.
182            if ($files) {
183                $progressperfile = (int)(self::PROGRESS_MAX / (count($files) * 10));
184            } else {
185                // If there are no files, avoid divide by zero.
186                $progressperfile = 1;
187            }
188            $done = 0;
189
190            // Expand the provided files into a complete list of single files.
191            $expandedfiles = array();
192            foreach ($files as $archivepath => $file) {
193                // Update progress if required.
194                if ($progress) {
195                    $progress->progress($done, self::PROGRESS_MAX);
196                }
197                $done += $progressperfile;
198
199                if (is_null($file)) {
200                    // Empty directory record. Ensure it ends in a /.
201                    if (!preg_match('~/$~', $archivepath)) {
202                        $archivepath .= '/';
203                    }
204                    $expandedfiles[$archivepath] = null;
205                } else if (is_string($file)) {
206                    // File specified as path on disk.
207                    if (!$this->list_files_path($expandedfiles, $archivepath, $file,
208                            $progress, $done)) {
209                        gzclose($gz);
210                        unlink($archivefile);
211                        return false;
212                    }
213                } else if (is_array($file)) {
214                    // File specified as raw content in array.
215                    $expandedfiles[$archivepath] = $file;
216                } else {
217                    // File specified as stored_file object.
218                    $this->list_files_stored($expandedfiles, $archivepath, $file);
219                }
220            }
221
222            // Store the list of files as a special file that is first in the
223            // archive. This contains enough information to implement list_files
224            // if required later.
225            $list = self::ARCHIVE_INDEX_COUNT_PREFIX . count($expandedfiles) . "\n";
226            $sizes = array();
227            $mtimes = array();
228            foreach ($expandedfiles as $archivepath => $file) {
229                // Check archivepath doesn't contain any non-ASCII characters.
230                if (!preg_match('~^[\x00-\xff]*$~', $archivepath)) {
231                    throw new coding_exception(
232                            'Non-ASCII paths not supported: ' . $archivepath);
233                }
234
235                // Build up the details.
236                $type = 'f';
237                $mtime = '?';
238                if (is_null($file)) {
239                    $type = 'd';
240                    $size = 0;
241                } else if (is_string($file)) {
242                    $stat = stat($file);
243                    $mtime = (int)$stat['mtime'];
244                    $size = (int)$stat['size'];
245                } else if (is_array($file)) {
246                    $size = (int)strlen(reset($file));
247                } else {
248                    $mtime = (int)$file->get_timemodified();
249                    $size = (int)$file->get_filesize();
250                }
251                $sizes[$archivepath] = $size;
252                $mtimes[$archivepath] = $mtime;
253
254                // Write a line in the index.
255                $list .= "$archivepath\t$type\t$size\t$mtime\n";
256            }
257
258            // The index file is optional; only write into archive if needed.
259            if ($this->includeindex) {
260                // Put the index file into the archive.
261                $this->write_tar_entry($gz, self::ARCHIVE_INDEX_FILE, null, strlen($list), '?', $list);
262            }
263
264            // Update progress ready for main stage.
265            $done = (int)(self::PROGRESS_MAX / 10);
266            if ($progress) {
267                $progress->progress($done, self::PROGRESS_MAX);
268            }
269            if ($expandedfiles) {
270                // The remaining 9/10ths of progress represents these files.
271                $progressperfile = (int)((9 * self::PROGRESS_MAX) / (10 * count($expandedfiles)));
272            } else {
273                $progressperfile = 1;
274            }
275
276            // Actually write entries for each file/directory.
277            foreach ($expandedfiles as $archivepath => $file) {
278                if (is_null($file)) {
279                    // Null entry indicates a directory.
280                    $this->write_tar_entry($gz, $archivepath, null,
281                            $sizes[$archivepath], $mtimes[$archivepath]);
282                } else if (is_string($file)) {
283                    // String indicates an OS file.
284                    $this->write_tar_entry($gz, $archivepath, $file,
285                            $sizes[$archivepath], $mtimes[$archivepath], null, $progress, $done);
286                } else if (is_array($file)) {
287                    // Array indicates in-memory data.
288                    $data = reset($file);
289                    $this->write_tar_entry($gz, $archivepath, null,
290                            $sizes[$archivepath], $mtimes[$archivepath], $data, $progress, $done);
291                } else {
292                    // Stored_file object.
293                    $this->write_tar_entry($gz, $archivepath, $file->get_content_file_handle(),
294                            $sizes[$archivepath], $mtimes[$archivepath], null, $progress, $done);
295                }
296                $done += $progressperfile;
297                if ($progress) {
298                    $progress->progress($done, self::PROGRESS_MAX);
299                }
300            }
301
302            // Finish tar file with two empty 512-byte records.
303            gzwrite($gz, str_pad('', 2 * self::TAR_BLOCK_SIZE, "\x00"));
304            gzclose($gz);
305            return true;
306        } catch (Exception $e) {
307            // If there is an exception, delete the in-progress file.
308            gzclose($gz);
309            unlink($archivefile);
310            throw $e;
311        }
312    }
313
314    /**
315     * Writes a single tar file to the archive, including its header record and
316     * then the file contents.
317     *
318     * @param resource $gz Gzip file
319     * @param string $archivepath Full path of file within archive
320     * @param string|resource $file Full path of file on disk or file handle or null if none
321     * @param int $size Size or 0 for directories
322     * @param int|string $mtime Time or ? if unknown
323     * @param string $content Actual content of file to write (null if using $filepath)
324     * @param file_progress $progress Progress indicator or null if none
325     * @param int $done Value for progress indicator
326     * @return bool True if OK
327     * @throws coding_exception If names aren't valid
328     */
329    protected function write_tar_entry($gz, $archivepath, $file, $size, $mtime, $content = null,
330            file_progress $progress = null, $done = 0) {
331        // Header based on documentation of POSIX ustar format from:
332        // http://www.freebsd.org/cgi/man.cgi?query=tar&sektion=5&manpath=FreeBSD+8-current .
333
334        // For directories, ensure name ends in a slash.
335        $directory = false;
336        if ($size === 0 && is_null($file)) {
337            $directory = true;
338            if (!preg_match('~/$~', $archivepath)) {
339                $archivepath .= '/';
340            }
341            $mode = '755';
342        } else {
343            $mode = '644';
344        }
345
346        // Split archivepath into name and prefix.
347        $name = $archivepath;
348        $prefix = '';
349        while (strlen($name) > 100) {
350            $slash = strpos($name, '/');
351            if ($slash === false) {
352                throw new coding_exception(
353                        'Name cannot fit length restrictions (> 100 characters): ' . $archivepath);
354            }
355
356            if ($prefix !== '') {
357                $prefix .= '/';
358            }
359            $prefix .= substr($name, 0, $slash);
360            $name = substr($name, $slash + 1);
361            if (strlen($prefix) > 155) {
362                throw new coding_exception(
363                        'Name cannot fit length restrictions (path too long): ' . $archivepath);
364            }
365        }
366
367        // Checksum performance is a bit slow because of having to call 'ord'
368        // lots of times (it takes about 1/3 the time of the actual gzwrite
369        // call). To improve performance of checksum calculation, we will
370        // store all the non-zero, non-fixed bytes that need adding to the
371        // checksum, and checksum only those bytes.
372        $forchecksum = $name;
373
374        // struct header_posix_ustar {
375        //    char name[100];
376        $header = str_pad($name, 100, "\x00");
377
378        //    char mode[8];
379        //    char uid[8];
380        //    char gid[8];
381        $header .= '0000' . $mode . "\x000000000\x000000000\x00";
382        $forchecksum .= $mode;
383
384        //    char size[12];
385        $octalsize = decoct($size);
386        if (strlen($octalsize) > 11) {
387            throw new coding_exception(
388                    'File too large for .tar file: ' . $archivepath . ' (' . $size . ' bytes)');
389        }
390        $paddedsize = str_pad($octalsize, 11, '0', STR_PAD_LEFT);
391        $forchecksum .= $paddedsize;
392        $header .= $paddedsize . "\x00";
393
394        //    char mtime[12];
395        if ($mtime === '?') {
396            // Use a default timestamp rather than zero; GNU tar outputs
397            // warnings about zeroes here.
398            $mtime = self::DEFAULT_TIMESTAMP;
399        }
400        $octaltime = decoct($mtime);
401        $paddedtime = str_pad($octaltime, 11, '0', STR_PAD_LEFT);
402        $forchecksum .= $paddedtime;
403        $header .= $paddedtime . "\x00";
404
405        //    char checksum[8];
406        // Checksum needs to be completed later.
407        $header .= '        ';
408
409        //    char typeflag[1];
410        $typeflag = $directory ? '5' : '0';
411        $forchecksum .= $typeflag;
412        $header .= $typeflag;
413
414        //    char linkname[100];
415        $header .= str_pad('', 100, "\x00");
416
417        //    char magic[6];
418        //    char version[2];
419        $header .= "ustar\x0000";
420
421        //    char uname[32];
422        //    char gname[32];
423        //    char devmajor[8];
424        //    char devminor[8];
425        $header .= str_pad('', 80, "\x00");
426
427        //    char prefix[155];
428        //    char pad[12];
429        $header .= str_pad($prefix, 167, "\x00");
430        $forchecksum .= $prefix;
431
432        // };
433
434        // We have now calculated the header, but without the checksum. To work
435        // out the checksum, sum all the bytes that aren't fixed or zero, and add
436        // to a standard value that contains all the fixed bytes.
437
438        // The fixed non-zero bytes are:
439        //
440        // '000000000000000000        ustar00'
441        // mode (except 3 digits), uid, gid, checksum space, magic number, version
442        //
443        // To calculate the number, call the calculate_checksum function on the
444        // above string. The result is 1775.
445        $checksum = 1775 + self::calculate_checksum($forchecksum);
446
447        $octalchecksum = str_pad(decoct($checksum), 6, '0', STR_PAD_LEFT) . "\x00 ";
448
449        // Slot it into place in the header.
450        $header = substr($header, 0, 148) . $octalchecksum . substr($header, 156);
451
452        if (strlen($header) != self::TAR_BLOCK_SIZE) {
453            throw new coding_exception('Header block wrong size!!!!!');
454        }
455
456        // Awesome, now write out the header.
457        gzwrite($gz, $header);
458
459        // Special pre-handler for OS filename.
460        if (is_string($file)) {
461            $file = fopen($file, 'rb');
462            if (!$file) {
463                return false;
464            }
465        }
466
467        if ($content !== null) {
468            // Write in-memory content if any.
469            if (strlen($content) !== $size) {
470                throw new coding_exception('Mismatch between provided sizes: ' . $archivepath);
471            }
472            gzwrite($gz, $content);
473        } else if ($file !== null) {
474            // Write file content if any, using a 64KB buffer.
475            $written = 0;
476            $chunks = 0;
477            while (true) {
478                $data = fread($file, 65536);
479                if ($data === false || strlen($data) == 0) {
480                    break;
481                }
482                $written += gzwrite($gz, $data);
483
484                // After every megabyte of large files, update the progress
485                // tracker (so there are no long gaps without progress).
486                $chunks++;
487                if ($chunks == 16) {
488                    $chunks = 0;
489                    if ($progress) {
490                        // This call always has the same values, but that gives
491                        // the tracker a chance to indicate indeterminate
492                        // progress and output something to avoid timeouts.
493                        $progress->progress($done, self::PROGRESS_MAX);
494                    }
495                }
496            }
497            fclose($file);
498
499            if ($written !== $size) {
500                throw new coding_exception('Mismatch between provided sizes: ' . $archivepath .
501                        ' (was ' . $written . ', expected ' . $size . ')');
502            }
503        } else if ($size != 0) {
504            throw new coding_exception('Missing data file handle for non-empty file');
505        }
506
507        // Pad out final 512-byte block in file, if applicable.
508        $leftover = self::TAR_BLOCK_SIZE - ($size % self::TAR_BLOCK_SIZE);
509        if ($leftover == 512) {
510            $leftover = 0;
511        } else {
512            gzwrite($gz, str_pad('', $leftover, "\x00"));
513        }
514
515        return true;
516    }
517
518    /**
519     * Calculates a checksum by summing all characters of the binary string
520     * (treating them as unsigned numbers).
521     *
522     * @param string $str Input string
523     * @return int Checksum
524     */
525    protected static function calculate_checksum($str) {
526        $checksum = 0;
527        $checklength = strlen($str);
528        for ($i = 0; $i < $checklength; $i++) {
529            $checksum += ord($str[$i]);
530        }
531        return $checksum;
532    }
533
534    /**
535     * Based on an OS path, adds either that path (if it's a file) or
536     * all its children (if it's a directory) into the list of files to
537     * archive.
538     *
539     * If a progress indicator is supplied and if this corresponds to a
540     * directory, then it will be repeatedly called with the same values. This
541     * allows the progress handler to respond in some way to avoid timeouts
542     * if required.
543     *
544     * @param array $expandedfiles List of all files to archive (output)
545     * @param string $archivepath Current path within archive
546     * @param string $path OS path on disk
547     * @param file_progress $progress Progress indicator or null if none
548     * @param int $done Value for progress indicator
549     * @return bool True if successful
550     */
551    protected function list_files_path(array &$expandedfiles, $archivepath, $path,
552            file_progress $progress = null, $done) {
553        if (is_dir($path)) {
554            // Unless we're using this directory as archive root, add a
555            // directory entry.
556            if ($archivepath != '') {
557                // Add directory-creation record.
558                $expandedfiles[$archivepath . '/'] = null;
559            }
560
561            // Loop through directory contents and recurse.
562            if (!$handle = opendir($path)) {
563                return false;
564            }
565            while (false !== ($entry = readdir($handle))) {
566                if ($entry === '.' || $entry === '..') {
567                    continue;
568                }
569                $result = $this->list_files_path($expandedfiles,
570                        $archivepath . '/' . $entry, $path . '/' . $entry,
571                        $progress, $done);
572                if (!$result) {
573                    return false;
574                }
575                if ($progress) {
576                    $progress->progress($done, self::PROGRESS_MAX);
577                }
578            }
579            closedir($handle);
580        } else {
581            // Just add it to list.
582            $expandedfiles[$archivepath] = $path;
583        }
584        return true;
585    }
586
587    /**
588     * Based on a stored_file objects, adds either that file (if it's a file) or
589     * all its children (if it's a directory) into the list of files to
590     * archive.
591     *
592     * If a progress indicator is supplied and if this corresponds to a
593     * directory, then it will be repeatedly called with the same values. This
594     * allows the progress handler to respond in some way to avoid timeouts
595     * if required.
596     *
597     * @param array $expandedfiles List of all files to archive (output)
598     * @param string $archivepath Current path within archive
599     * @param stored_file $file File object
600     */
601    protected function list_files_stored(array &$expandedfiles, $archivepath, stored_file $file) {
602        if ($file->is_directory()) {
603            // Add a directory-creation record.
604            $expandedfiles[$archivepath . '/'] = null;
605
606            // Loop through directory contents (this is a recursive collection
607            // of all children not just one directory).
608            $fs = get_file_storage();
609            $baselength = strlen($file->get_filepath());
610            $files = $fs->get_directory_files(
611                    $file->get_contextid(), $file->get_component(), $file->get_filearea(), $file->get_itemid(),
612                    $file->get_filepath(), true, true);
613            foreach ($files as $childfile) {
614                // Get full pathname after original part.
615                $path = $childfile->get_filepath();
616                $path = substr($path, $baselength);
617                $path = $archivepath . '/' . $path;
618                if ($childfile->is_directory()) {
619                    $childfile = null;
620                } else {
621                    $path .= $childfile->get_filename();
622                }
623                $expandedfiles[$path] = $childfile;
624            }
625        } else {
626            // Just add it to list.
627            $expandedfiles[$archivepath] = $file;
628        }
629    }
630
631    /**
632     * Extract file to given file path (real OS filesystem), existing files are overwritten.
633     *
634     * @param stored_file|string $archivefile full pathname of zip file or stored_file instance
635     * @param string $pathname target directory
636     * @param array $onlyfiles only extract files present in the array
637     * @param file_progress $progress Progress indicator callback or null if not required
638     * @param bool $returnbool Whether to return a basic true/false indicating error state, or full per-file error
639     * details.
640     * @return array list of processed files (name=>true)
641     * @throws moodle_exception If error
642     */
643    public function extract_to_pathname($archivefile, $pathname,
644            array $onlyfiles = null, file_progress $progress = null, $returnbool = false) {
645        $extractor = new tgz_extractor($archivefile);
646        try {
647            $result = $extractor->extract(
648                    new tgz_packer_extract_to_pathname($pathname, $onlyfiles), $progress);
649            if ($returnbool) {
650                if (!is_array($result)) {
651                    return false;
652                }
653                foreach ($result as $status) {
654                    if ($status !== true) {
655                        return false;
656                    }
657                }
658                return true;
659            } else {
660                return $result;
661            }
662        } catch (moodle_exception $e) {
663            if ($returnbool) {
664                return false;
665            } else {
666                throw $e;
667            }
668        }
669    }
670
671    /**
672     * Extract file to given file path (real OS filesystem), existing files are overwritten.
673     *
674     * @param string|stored_file $archivefile full pathname of zip file or stored_file instance
675     * @param int $contextid context ID
676     * @param string $component component
677     * @param string $filearea file area
678     * @param int $itemid item ID
679     * @param string $pathbase file path
680     * @param int $userid user ID
681     * @param file_progress $progress Progress indicator callback or null if not required
682     * @return array list of processed files (name=>true)
683     * @throws moodle_exception If error
684     */
685    public function extract_to_storage($archivefile, $contextid,
686            $component, $filearea, $itemid, $pathbase, $userid = null,
687            file_progress $progress = null) {
688        $extractor = new tgz_extractor($archivefile);
689        return $extractor->extract(
690                new tgz_packer_extract_to_storage($contextid, $component,
691                    $filearea, $itemid, $pathbase, $userid), $progress);
692    }
693
694    /**
695     * Returns array of info about all files in archive.
696     *
697     * @param string|stored_file $archivefile
698     * @return array of file infos
699     */
700    public function list_files($archivefile) {
701        $extractor = new tgz_extractor($archivefile);
702        return $extractor->list_files();
703    }
704
705    /**
706     * Checks whether a file appears to be a .tar.gz file.
707     *
708     * @param string|stored_file $archivefile
709     * @return bool True if file contains the gzip magic number
710     */
711    public static function is_tgz_file($archivefile) {
712        if (is_a($archivefile, 'stored_file')) {
713            $fp = $archivefile->get_content_file_handle();
714        } else {
715            $fp = fopen($archivefile, 'rb');
716        }
717        $firstbytes = fread($fp, 2);
718        fclose($fp);
719        return ($firstbytes[0] == "\x1f" && $firstbytes[1] == "\x8b");
720    }
721
722    /**
723     * The zlib extension is required for this packer to work. This is a single
724     * location for the code to check whether the extension is available.
725     *
726     * @deprecated since 2.7 Always true because zlib extension is now required.
727     *
728     * @return bool True if the zlib extension is available OK
729     */
730    public static function has_required_extension() {
731        return extension_loaded('zlib');
732    }
733}
734
735
/**
 * Handles extraction to pathname.
 *
 * Handler object that tgz_packer::extract_to_pathname passes to
 * tgz_extractor::extract. It maps archive paths onto paths below a target
 * directory on disk and can restrict extraction to a given list of
 * archive paths.
 */
class tgz_packer_extract_to_pathname implements tgz_extractor_handler {
    /**
     * @var string Target directory for extract.
     */
    protected $pathname;
    /**
     * @var array Array of files to extract (other files are skipped).
     */
    protected $onlyfiles;

    /**
     * Constructor.
     *
     * @param string $pathname target directory
     * @param array $onlyfiles only extract files present in the array
     *   (null means no restriction)
     */
    public function __construct($pathname, array $onlyfiles = null) {
        $this->pathname = $pathname;
        $this->onlyfiles = $onlyfiles;
    }

    /**
     * Decides whether an archive path passes the $onlyfiles restriction.
     *
     * Entries are compared as exact strings. A loose comparison would treat
     * numeric-looking names as equal (e.g. '0123' and '123'), and so extract
     * entries that were not requested. Casting both sides to string keeps
     * integer entries working (PHP turns numeric array keys into integers).
     *
     * @param string $archivepath Path of the entry within the archive
     * @return bool True if the entry should be extracted
     */
    private function is_selected($archivepath) {
        if ($this->onlyfiles === null) {
            return true;
        }
        foreach ($this->onlyfiles as $wanted) {
            if ((string)$wanted === (string)$archivepath) {
                return true;
            }
        }
        return false;
    }

    /**
     * Returns the on-disk path for a file entry, creating its parent
     * directory if needed, or null if the entry is excluded by $onlyfiles.
     *
     * @see tgz_extractor_handler::tgz_start_file()
     * @param string $archivepath Path of the file within the archive
     * @return string|null Full target path, or null to skip the file
     */
    public function tgz_start_file($archivepath) {
        // Check file restriction.
        if (!$this->is_selected($archivepath)) {
            return null;
        }
        // Ensure directory exists and prepare filename.
        $fullpath = $this->pathname . '/' . $archivepath;
        check_dir_exists(dirname($fullpath));
        return $fullpath;
    }

    /**
     * Nothing needs doing once a file has been written to disk.
     *
     * @see tgz_extractor_handler::tgz_end_file()
     * @param string $archivepath Path of the file within the archive
     * @param string $realpath Path the file was written to
     */
    public function tgz_end_file($archivepath, $realpath) {
        // Do nothing.
    }

    /**
     * Creates the directory for a directory entry, unless the entry is
     * excluded by $onlyfiles.
     *
     * @see tgz_extractor_handler::tgz_directory()
     * @param string $archivepath Path of the directory within the archive
     * @param int $mtime Modified time of the directory (not used here)
     * @return bool True if the directory was handled, false if skipped
     */
    public function tgz_directory($archivepath, $mtime) {
        // Check file restriction.
        if (!$this->is_selected($archivepath)) {
            return false;
        }
        // Ensure directory exists.
        $fullpath = $this->pathname . '/' . $archivepath;
        check_dir_exists($fullpath);
        return true;
    }
}
795
796
/**
 * Handles extraction to file storage.
 *
 * Every archive file is routed through one temp file path, whose content is
 * then copied into file storage under the configured context, component,
 * file area and item id.
 */
class tgz_packer_extract_to_storage implements tgz_extractor_handler {
    /**
     * @var string Path to temp file.
     */
    protected $tempfile;

    /**
     * @var int Context id for files.
     */
    protected $contextid;
    /**
     * @var string Component name for files.
     */
    protected $component;
    /**
     * @var string File area for files.
     */
    protected $filearea;
    /**
     * @var int Item ID for files.
     */
    protected $itemid;
    /**
     * @var string Base path for files (subfolders will go inside this).
     */
    protected $pathbase;
    /**
     * @var int User id for files or null if none.
     */
    protected $userid;

    /**
     * Constructor.
     *
     * Stores the destination details and reserves a temp file inside
     * $CFG->tempdir/core_files.
     *
     * @param int $contextid Context id for files.
     * @param string $component Component name for files.
     * @param string $filearea File area for files.
     * @param int $itemid Item ID for files.
     * @param string $pathbase Base path for files (subfolders will go inside this).
     * @param int $userid User id for files or null if none.
     */
    public function __construct($contextid, $component, $filearea, $itemid, $pathbase, $userid) {
        global $CFG;

        // Store all data.
        $this->contextid = $contextid;
        $this->component = $component;
        $this->filearea = $filearea;
        $this->itemid = $itemid;
        $this->pathbase = $pathbase;
        $this->userid = $userid;

        // Obtain temp filename. Note that tempnam() uses '.dat' as a filename
        // prefix, not as an extension.
        $tempfolder = $CFG->tempdir . '/core_files';
        check_dir_exists($tempfolder);
        $this->tempfile = tempnam($tempfolder, '.dat');
    }

    /**
     * Returns the temp file path; the same path is handed out for every file.
     *
     * @see tgz_extractor_handler::tgz_start_file()
     */
    public function tgz_start_file($archivepath) {
        // All files are stored in the same filename.
        return $this->tempfile;
    }

    /**
     * Copies the temp file into file storage at the location derived from the
     * archive path, replacing any existing file record, then removes the temp
     * file. The temp file is also removed when storing fails; the exception is
     * rethrown unchanged.
     *
     * @see tgz_extractor_handler::tgz_end_file()
     */
    public function tgz_end_file($archivepath, $realpath) {
        // dirname() returns '.' for an entry with no directory part. Appending
        // that would give a '<pathbase>./' file path, so such entries are
        // placed directly in the base path instead.
        // NOTE(review): assumes $pathbase ends with '/', as the concatenation
        // in tgz_directory() suggests - confirm against callers.
        $directory = dirname($archivepath);
        $subpath = ($directory === '.') ? '' : $directory . '/';

        $filerecord = array(
            'contextid' => $this->contextid,
            'component' => $this->component,
            'filearea' => $this->filearea,
            'itemid' => $this->itemid,
            'filepath' => $this->pathbase . $subpath,
            'filename' => basename($archivepath),
        );
        if ($this->userid) {
            $filerecord['userid'] = $this->userid;
        }

        $fs = get_file_storage();
        try {
            // Delete existing file (if any) and create new one.
            tgz_packer::delete_existing_file_record($fs, $filerecord);
            $fs->create_file_from_pathname($filerecord, $this->tempfile);
        } catch (Exception $e) {
            // Do not leave the temp file behind when storing fails.
            unlink($this->tempfile);
            throw $e;
        }
        unlink($this->tempfile);
    }

    /**
     * Creates the directory in file storage unless it is already present.
     * Always returns true. The $mtime argument is not used.
     *
     * @see tgz_extractor_handler::tgz_directory()
     */
    public function tgz_directory($archivepath, $mtime) {
        // Standardise path so that it always ends with a slash.
        if (!preg_match('~/$~', $archivepath)) {
            $archivepath .= '/';
        }
        $filepath = $this->pathbase . $archivepath;

        // Create directory if it doesn't already exist.
        $fs = get_file_storage();
        $exists = $fs->file_exists($this->contextid, $this->component, $this->filearea,
                $this->itemid, $filepath, '.');
        if (!$exists) {
            $fs->create_directory($this->contextid, $this->component, $this->filearea,
                    $this->itemid, $filepath);
        }
        return true;
    }
}
903