dokuwiki/inc/io.php

835 lines
23 KiB
PHP

<?php
/**
* File IO functions
*
* @license GPL 2 (http://www.gnu.org/licenses/gpl.html)
* @author Andreas Gohr <andi@splitbrain.org>
*/
use dokuwiki\Utf8\PhpString;
use dokuwiki\HTTP\DokuHTTPClient;
use dokuwiki\Extension\Event;
/**
* Removes empty directories
*
* Sends IO_NAMESPACE_DELETED events for 'pages' and 'media' namespaces.
* Event data:
* $data[0] ns: The colon separated namespace path minus the trailing page name.
* $data[1] ns_type: 'pages' or 'media' namespace tree.
*
* @param string $id - a pageid, the namespace of that id will be tried to deleted
* @param string $basedir - the config name of the type to delete (datadir or mediadir usally)
* @return bool - true if at least one namespace was deleted
*
* @author Andreas Gohr <andi@splitbrain.org>
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function io_sweepNS($id, $basedir = 'datadir')
{
global $conf;
$types = ['datadir' => 'pages', 'mediadir' => 'media'];
$ns_type = ($types[$basedir] ?? false);
$delone = false;
//scan all namespaces
while (($id = getNS($id)) !== false) {
$dir = $conf[$basedir] . '/' . utf8_encodeFN(str_replace(':', '/', $id));
//try to delete dir else return
if (@rmdir($dir)) {
if ($ns_type !== false) {
$data = [$id, $ns_type];
$delone = true; // we deleted at least one dir
Event::createAndTrigger('IO_NAMESPACE_DELETED', $data);
}
} else {
return $delone;
}
}
return $delone;
}
/**
* Used to read in a DokuWiki page from file, and send IO_WIKIPAGE_READ events.
*
* Generates the action event which delegates to io_readFile().
* Action plugins are allowed to modify the page content in transit.
* The file path should not be changed.
*
* Event data:
* $data[0] The raw arguments for io_readFile as an array.
* $data[1] ns: The colon separated namespace path minus the trailing page name. (false if root ns)
* $data[2] page_name: The wiki page name.
* $data[3] rev: The page revision, false for current wiki pages.
*
* @param string $file filename
* @param string $id page id
* @param bool|int|string $rev revision timestamp
* @return string
*
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function io_readWikiPage($file, $id, $rev = false)
{
if (empty($rev)) {
$rev = false;
}
$data = [[$file, true], getNS($id), noNS($id), $rev];
return Event::createAndTrigger('IO_WIKIPAGE_READ', $data, '_io_readWikiPage_action', false);
}
/**
* Callback adapter for io_readFile().
*
* @param array $data event data
* @return string
*
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function _io_readWikiPage_action($data)
{
if (is_array($data) && is_array($data[0]) && count($data[0]) === 2) {
return io_readFile(...$data[0]);
} else {
return ''; //callback error
}
}
/**
* Returns content of $file as cleaned string.
*
* Uses gzip if extension is .gz
*
* If you want to use the returned value in unserialize
* be sure to set $clean to false!
*
*
* @param string $file filename
* @param bool $clean
* @return string|bool the file contents or false on error
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_readFile($file, $clean = true)
{
$ret = '';
if (file_exists($file)) {
if (str_ends_with($file, '.gz')) {
if (!DOKU_HAS_GZIP) return false;
$ret = gzfile($file);
if (is_array($ret)) {
$ret = implode('', $ret);
}
} elseif (str_ends_with($file, '.bz2')) {
if (!DOKU_HAS_BZIP) return false;
$ret = bzfile($file);
} else {
$ret = file_get_contents($file);
}
}
if ($ret === null) return false;
if ($ret !== false && $clean) {
return cleanText($ret);
} else {
return $ret;
}
}
/**
* Returns the content of a .bz2 compressed file as string
*
* @param string $file filename
* @param bool $array return array of lines
* @return string|array|bool content or false on error
*
* @author marcel senf <marcel@rucksackreinigung.de>
* @author Andreas Gohr <andi@splitbrain.org>
*/
function bzfile($file, $array = false)
{
$bz = bzopen($file, "r");
if ($bz === false) return false;
if ($array) {
$lines = [];
}
$str = '';
while (!feof($bz)) {
//8192 seems to be the maximum buffersize?
$buffer = bzread($bz, 8192);
if (($buffer === false) || (bzerrno($bz) !== 0)) {
return false;
}
$str .= $buffer;
if ($array) {
$pos = strpos($str, "\n");
while ($pos !== false) {
$lines[] = substr($str, 0, $pos + 1);
$str = substr($str, $pos + 1);
$pos = strpos($str, "\n");
}
}
}
bzclose($bz);
if ($array) {
if ($str !== '') {
$lines[] = $str;
}
return $lines;
}
return $str;
}
/**
* Used to write out a DokuWiki page to file, and send IO_WIKIPAGE_WRITE events.
*
* This generates an action event and delegates to io_saveFile().
* Action plugins are allowed to modify the page content in transit.
* The file path should not be changed.
* (The append parameter is set to false.)
*
* Event data:
* $data[0] The raw arguments for io_saveFile as an array.
* $data[1] ns: The colon separated namespace path minus the trailing page name. (false if root ns)
* $data[2] page_name: The wiki page name.
* $data[3] rev: The page revision, false for current wiki pages.
*
* @param string $file filename
* @param string $content
* @param string $id page id
* @param int|bool|string $rev timestamp of revision
* @return bool
*
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function io_writeWikiPage($file, $content, $id, $rev = false)
{
if (empty($rev)) {
$rev = false;
}
if ($rev === false) {
io_createNamespace($id); // create namespaces as needed
}
$data = [[$file, $content, false], getNS($id), noNS($id), $rev];
return Event::createAndTrigger('IO_WIKIPAGE_WRITE', $data, '_io_writeWikiPage_action', false);
}
/**
* Callback adapter for io_saveFile().
*
* @param array $data event data
* @return bool
*
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function _io_writeWikiPage_action($data)
{
if (is_array($data) && is_array($data[0]) && count($data[0]) === 3) {
$ok = io_saveFile(...$data[0]);
// for attic files make sure the file has the mtime of the revision
if ($ok && is_int($data[3]) && $data[3] > 0) {
@touch($data[0][0], $data[3]);
}
return $ok;
} else {
return false; //callback error
}
}
/**
* Internal function to save contents to a file.
*
* @param string $file filename path to file
* @param string $content
* @param bool $append
* @return bool true on success, otherwise false
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function _io_saveFile($file, $content, $append)
{
global $conf;
$mode = ($append) ? 'ab' : 'wb';
$fileexists = file_exists($file);
if (str_ends_with($file, '.gz')) {
if (!DOKU_HAS_GZIP) return false;
$fh = @gzopen($file, $mode . '9');
if (!$fh) return false;
gzwrite($fh, $content);
gzclose($fh);
} elseif (str_ends_with($file, '.bz2')) {
if (!DOKU_HAS_BZIP) return false;
if ($append) {
$bzcontent = bzfile($file);
if ($bzcontent === false) return false;
$content = $bzcontent . $content;
}
$fh = @bzopen($file, 'w');
if (!$fh) return false;
bzwrite($fh, $content);
bzclose($fh);
} else {
$fh = @fopen($file, $mode);
if (!$fh) return false;
fwrite($fh, $content);
fclose($fh);
}
if (!$fileexists && $conf['fperm']) {
chmod($file, $conf['fperm']);
}
return true;
}
/**
* Saves $content to $file.
*
* If the third parameter is set to true the given content
* will be appended.
*
* Uses gzip if extension is .gz
* and bz2 if extension is .bz2
*
* @param string $file filename path to file
* @param string $content
* @param bool $append
* @return bool true on success, otherwise false
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_saveFile($file, $content, $append = false)
{
io_makeFileDir($file);
io_lock($file);
if (!_io_saveFile($file, $content, $append)) {
msg("Writing $file failed", -1);
io_unlock($file);
return false;
}
io_unlock($file);
return true;
}
/**
* Replace one or more occurrences of a line in a file.
*
* The default, when $maxlines is 0 is to delete all matching lines then append a single line.
* A regex that matches any part of the line will remove the entire line in this mode.
* Captures in $newline are not available.
*
* Otherwise each line is matched and replaced individually, up to the first $maxlines lines
* or all lines if $maxlines is -1. If $regex is true then captures can be used in $newline.
*
* Be sure to include the trailing newline in $oldline when replacing entire lines.
*
* Uses gzip if extension is .gz
* and bz2 if extension is .bz2
*
* @param string $file filename
* @param string $oldline exact linematch to remove
* @param string $newline new line to insert
* @param bool $regex use regexp?
* @param int $maxlines number of occurrences of the line to replace
* @return bool true on success
*
* @author Steven Danz <steven-danz@kc.rr.com>
* @author Christopher Smith <chris@jalakai.co.uk>
* @author Patrick Brown <ptbrown@whoopdedo.org>
*/
function io_replaceInFile($file, $oldline, $newline, $regex = false, $maxlines = 0)
{
if ((string)$oldline === '') {
trigger_error('$oldline parameter cannot be empty in io_replaceInFile()', E_USER_WARNING);
return false;
}
if (!file_exists($file)) return true;
io_lock($file);
// load into array
if (str_ends_with($file, '.gz')) {
if (!DOKU_HAS_GZIP) return false;
$lines = gzfile($file);
} elseif (str_ends_with($file, '.bz2')) {
if (!DOKU_HAS_BZIP) return false;
$lines = bzfile($file, true);
} else {
$lines = file($file);
}
// make non-regexes into regexes
$pattern = $regex ? $oldline : '/^' . preg_quote($oldline, '/') . '$/';
$replace = $regex ? $newline : addcslashes($newline, '\$');
// remove matching lines
if ($maxlines > 0) {
$count = 0;
$matched = 0;
foreach ($lines as $i => $line) {
if ($count >= $maxlines) break;
// $matched will be set to 0|1 depending on whether pattern is matched and line replaced
$lines[$i] = preg_replace($pattern, $replace, $line, -1, $matched);
if ($matched) {
$count++;
}
}
} elseif ($maxlines == 0) {
$lines = preg_grep($pattern, $lines, PREG_GREP_INVERT);
if ((string)$newline !== '') {
$lines[] = $newline;
}
} else {
$lines = preg_replace($pattern, $replace, $lines);
}
if (count($lines)) {
if (!_io_saveFile($file, implode('', $lines), false)) {
msg("Removing content from $file failed", -1);
io_unlock($file);
return false;
}
} else {
@unlink($file);
}
io_unlock($file);
return true;
}
/**
* Delete lines that match $badline from $file.
*
* Be sure to include the trailing newline in $badline
*
* @param string $file filename
* @param string $badline exact linematch to remove
* @param bool $regex use regexp?
* @return bool true on success
*
* @author Patrick Brown <ptbrown@whoopdedo.org>
*/
function io_deleteFromFile($file, $badline, $regex = false)
{
return io_replaceInFile($file, $badline, '', $regex, 0);
}
/**
* Tries to lock a file
*
* Locking is only done for io_savefile and uses directories
* inside $conf['lockdir']
*
* It waits maximal 3 seconds for the lock, after this time
* the lock is assumed to be stale and the function goes on
*
* @param string $file filename
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_lock($file)
{
global $conf;
$lockDir = $conf['lockdir'] . '/' . md5($file);
@ignore_user_abort(1);
$timeStart = time();
do {
//waited longer than 3 seconds? -> stale lock
if ((time() - $timeStart) > 3) break;
$locked = @mkdir($lockDir);
if ($locked) {
if ($conf['dperm']) {
chmod($lockDir, $conf['dperm']);
}
break;
}
usleep(50);
} while ($locked === false);
}
/**
* Unlocks a file
*
* @param string $file filename
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_unlock($file)
{
global $conf;
$lockDir = $conf['lockdir'] . '/' . md5($file);
@rmdir($lockDir);
@ignore_user_abort(0);
}
/**
* Create missing namespace directories and send the IO_NAMESPACE_CREATED events
* in the order of directory creation. (Parent directories first.)
*
* Event data:
* $data[0] ns: The colon separated namespace path minus the trailing page name.
* $data[1] ns_type: 'pages' or 'media' namespace tree.
*
* @param string $id page id
* @param string $ns_type 'pages' or 'media'
*
* @author Ben Coburn <btcoburn@silicodon.net>
*/
function io_createNamespace($id, $ns_type = 'pages')
{
// verify ns_type
$types = ['pages' => 'wikiFN', 'media' => 'mediaFN'];
if (!isset($types[$ns_type])) {
trigger_error('Bad $ns_type parameter for io_createNamespace().');
return;
}
// make event list
$missing = [];
$ns_stack = explode(':', $id);
$ns = $id;
$tmp = dirname($file = call_user_func($types[$ns_type], $ns));
while (!@is_dir($tmp) && !(file_exists($tmp) && !is_dir($tmp))) {
array_pop($ns_stack);
$ns = implode(':', $ns_stack);
if (strlen($ns) == 0) {
break;
}
$missing[] = $ns;
$tmp = dirname(call_user_func($types[$ns_type], $ns));
}
// make directories
io_makeFileDir($file);
// send the events
$missing = array_reverse($missing); // inside out
foreach ($missing as $ns) {
$data = [$ns, $ns_type];
Event::createAndTrigger('IO_NAMESPACE_CREATED', $data);
}
}
/**
* Create the directory needed for the given file
*
* @param string $file file name
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_makeFileDir($file)
{
$dir = dirname($file);
if (!@is_dir($dir)) {
if (!io_mkdir_p($dir)) {
msg("Creating directory $dir failed", -1);
}
}
}
/**
* Creates a directory hierachy.
*
* @param string $target filename
* @return bool
*
* @link http://php.net/manual/en/function.mkdir.php
* @author <saint@corenova.com>
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_mkdir_p($target)
{
global $conf;
if (@is_dir($target) || empty($target)) return true; // best case check first
if (file_exists($target) && !is_dir($target)) return false;
//recursion
if (io_mkdir_p(substr($target, 0, strrpos($target, '/')))) {
$ret = @mkdir($target); // crawl back up & create dir tree
if ($ret && !empty($conf['dperm'])) {
chmod($target, $conf['dperm']);
}
return $ret;
}
return false;
}
/**
* Recursively delete a directory
*
* @param string $path
* @param bool $removefiles defaults to false which will delete empty directories only
* @return bool
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_rmdir($path, $removefiles = false)
{
if (!is_string($path) || $path == "") return false;
if (!file_exists($path)) return true; // it's already gone or was never there, count as success
if (is_dir($path) && !is_link($path)) {
$dirs = [];
$files = [];
if (!$dh = @opendir($path)) return false;
while (false !== ($f = readdir($dh))) {
if ($f == '..' || $f == '.') continue;
// collect dirs and files first
if (is_dir("$path/$f") && !is_link("$path/$f")) {
$dirs[] = "$path/$f";
} elseif ($removefiles) {
$files[] = "$path/$f";
} else {
return false; // abort when non empty
}
}
closedir($dh);
// now traverse into directories first
foreach ($dirs as $dir) {
if (!io_rmdir($dir, $removefiles)) return false; // abort on any error
}
// now delete files
foreach ($files as $file) {
if (!@unlink($file)) return false; //abort on any error
}
// remove self
return @rmdir($path);
} elseif ($removefiles) {
return @unlink($path);
}
return false;
}
/**
* Creates a unique temporary directory and returns
* its path.
*
* @return false|string path to new directory or false
* @throws Exception
*
* @author Michael Klier <chi@chimeric.de>
*/
function io_mktmpdir()
{
global $conf;
$base = $conf['tmpdir'];
$dir = md5(uniqid(random_int(0, mt_getrandmax()), true));
$tmpdir = $base . '/' . $dir;
if (io_mkdir_p($tmpdir)) {
return $tmpdir;
} else {
return false;
}
}
/**
* downloads a file from the net and saves it
*
* if $useAttachment is false,
* - $file is the full filename to save the file, incl. path
* - if successful will return true, false otherwise
*
* if $useAttachment is true,
* - $file is the directory where the file should be saved
* - if successful will return the name used for the saved file, false otherwise
*
* @param string $url url to download
* @param string $file path to file or directory where to save
* @param bool $useAttachment true: try to use name of download, uses otherwise $defaultName
* false: uses $file as path to file
* @param string $defaultName fallback for if using $useAttachment
* @param int $maxSize maximum file size
* @return bool|string if failed false, otherwise true or the name of the file in the given dir
*
* @author Andreas Gohr <andi@splitbrain.org>
* @author Chris Smith <chris@jalakai.co.uk>
*/
function io_download($url, $file, $useAttachment = false, $defaultName = '', $maxSize = 2_097_152)
{
global $conf;
$http = new DokuHTTPClient();
$http->max_bodysize = $maxSize;
$http->timeout = 25; //max. 25 sec
$http->keep_alive = false; // we do single ops here, no need for keep-alive
$data = $http->get($url);
if (!$data) return false;
$name = '';
if ($useAttachment) {
if (isset($http->resp_headers['content-disposition'])) {
$content_disposition = $http->resp_headers['content-disposition'];
$match = [];
if (
is_string($content_disposition) &&
preg_match('/attachment;\s*filename\s*=\s*"([^"]*)"/i', $content_disposition, $match)
) {
$name = PhpString::basename($match[1]);
}
}
if (!$name) {
if (!$defaultName) return false;
$name = $defaultName;
}
$file .= $name;
}
$fileexists = file_exists($file);
$fp = @fopen($file, "w");
if (!$fp) return false;
fwrite($fp, $data);
fclose($fp);
if (!$fileexists && $conf['fperm']) {
chmod($file, $conf['fperm']);
}
if ($useAttachment) return $name;
return true;
}
/**
* Windows compatible rename
*
* rename() can not overwrite existing files on Windows
* this function will use copy/unlink instead
*
* @param string $from
* @param string $to
* @return bool succes or fail
*/
function io_rename($from, $to)
{
global $conf;
if (!@rename($from, $to)) {
if (@copy($from, $to)) {
if ($conf['fperm']) {
chmod($to, $conf['fperm']);
}
@unlink($from);
return true;
}
return false;
}
return true;
}
/**
* Runs an external command with input and output pipes.
* Returns the exit code from the process.
*
* @param string $cmd
* @param string $input input pipe
* @param string $output output pipe
* @return int exit code from process
*
* @author Tom N Harris <tnharris@whoopdedo.org>
*/
function io_exec($cmd, $input, &$output)
{
$descspec = [
0 => ["pipe", "r"],
1 => ["pipe", "w"],
2 => ["pipe", "w"]
];
$ph = proc_open($cmd, $descspec, $pipes);
if (!$ph) return -1;
fclose($pipes[2]); // ignore stderr
fwrite($pipes[0], $input);
fclose($pipes[0]);
$output = stream_get_contents($pipes[1]);
fclose($pipes[1]);
return proc_close($ph);
}
/**
* Search a file for matching lines
*
* This is probably not faster than file()+preg_grep() but less
* memory intensive because not the whole file needs to be loaded
* at once.
*
* @param string $file The file to search
* @param string $pattern PCRE pattern
* @param int $max How many lines to return (0 for all)
* @param bool $backref When true returns array with backreferences instead of lines
* @return array matching lines or backref, false on error
*
* @author Andreas Gohr <andi@splitbrain.org>
*/
function io_grep($file, $pattern, $max = 0, $backref = false)
{
$fh = @fopen($file, 'r');
if (!$fh) return false;
$matches = [];
$cnt = 0;
$line = '';
while (!feof($fh)) {
$line .= fgets($fh, 4096); // read full line
if (!str_ends_with($line, "\n")) continue;
// check if line matches
if (preg_match($pattern, $line, $match)) {
if ($backref) {
$matches[] = $match;
} else {
$matches[] = $line;
}
$cnt++;
}
if ($max && $max == $cnt) break;
$line = '';
}
fclose($fh);
return $matches;
}
/**
* Get size of contents of a file, for a compressed file the uncompressed size
* Warning: reading uncompressed size of content of bz-files requires uncompressing
*
* @param string $file filename path to file
* @return int size of file
*
* @author Gerrit Uitslag <klapinklapin@gmail.com>
*/
function io_getSizeFile($file)
{
if (!file_exists($file)) return 0;
if (str_ends_with($file, '.gz')) {
$fp = @fopen($file, "rb");
if ($fp === false) return 0;
fseek($fp, -4, SEEK_END);
$buffer = fread($fp, 4);
fclose($fp);
$array = unpack("V", $buffer);
$uncompressedsize = end($array);
} elseif (str_ends_with($file, '.bz2')) {
if (!DOKU_HAS_BZIP) return 0;
$bz = bzopen($file, "r");
if ($bz === false) return 0;
$uncompressedsize = 0;
while (!feof($bz)) {
//8192 seems to be the maximum buffersize?
$buffer = bzread($bz, 8192);
if (($buffer === false) || (bzerrno($bz) !== 0)) {
return 0;
}
$uncompressedsize += strlen($buffer);
}
} else {
$uncompressedsize = filesize($file);
}
return $uncompressedsize;
}