X-Git-Url: https://git.immae.eu/?a=blobdiff_plain;f=inc%2Ffunctions.php;h=68c3612f1952628d154ca14cb1e4ad16d4344747;hb=07a192525d19bcafc11bc68d62c30d2d4846faee;hp=0b9eb93697f291150e21d2669b6e05d30946f9cf;hpb=3c8d80aec5f5ba15910014bb4dcb48e948041ec9;p=github%2Fwallabag%2Fwallabag.git diff --git a/inc/functions.php b/inc/functions.php old mode 100755 new mode 100644 index 0b9eb936..68c3612f --- a/inc/functions.php +++ b/inc/functions.php @@ -3,7 +3,7 @@ /** * Permet de générer l'URL de poche pour le bookmarklet */ -function url() +function get_poche_url() { $protocol = "http"; if(isset($_SERVER['HTTPS'])) { @@ -15,32 +15,10 @@ function url() return $protocol . "://" . $_SERVER['HTTP_HOST'] . $_SERVER['REQUEST_URI']; } -/** - * Génération de la page "vue d'un article" - */ -function generate_page($entry) -{ - raintpl::$tpl_dir = './tpl/'; - raintpl::$cache_dir = "./cache/"; - raintpl::$base_url = url(); - raintpl::configure( 'path_replace', false ); - raintpl::configure('debug', false); - - $tpl = new raintpl(); - - $tpl->assign("id", $entry['id']); - $tpl->assign("url", $entry['url']); - $tpl->assign("title", $entry['title']); - $tpl->assign("content", $entry['content']); - $tpl->assign("is_fav", $entry['is_fav']); - $tpl->assign("is_read", $entry['is_read']); - - $tpl->draw( "index"); -} - // function define to retrieve url content -function get_external_file($url, $timeout) +function get_external_file($url) { + $timeout = 15; // spoofing FireFox 18.0 $useragent="Mozilla/5.0 (Windows NT 5.1; rv:18.0) Gecko/20100101 Firefox/18.0"; @@ -68,14 +46,10 @@ function get_external_file($url, $timeout) } else { // create http context and add timeout and user-agent - $context = stream_context_create(array('http'=>array('timeout' => $timeout, // Timeout : time until we stop waiting for the response. - 'header'=> "User-Agent: ".$useragent, // spoot Mozilla Firefox - 'follow_location' => true - ))); + $context = stream_context_create(array('http'=>array('timeout' => $timeout,'header'=> "User-Agent: ".$useragent,/*spoot Mozilla Firefox*/'follow_location' => true))); // only download page lesser than 4MB $data = @file_get_contents($url, false, $context, -1, 4000000); // We download at most 4 MB from source. - // echo "
http_response_header : ".print_r($http_response_header); if(isset($http_response_header) and isset($http_response_header[0])) { $httpcodeOK = isset($http_response_header) and isset($http_response_header[0]) and ((strpos($http_response_header[0], '200 OK') !== FALSE) or (strpos($http_response_header[0], '301 Moved Permanently') !== FALSE)); @@ -111,7 +85,10 @@ function get_external_file($url, $timeout) } } -function prepare_url($url) +/** + * Préparation de l'URL avec récupération du contenu avant insertion en base + */ +function prepare_url($url, $id) { $parametres = array(); $url = html_entity_decode(trim($url)); @@ -130,14 +107,308 @@ function prepare_url($url) if (isset($html) and strlen($html) > 0) { $r = new Readability($html, $url); + $r->convertLinksToFootnotes = TRUE; if($r->init()) { - $title = $r->articleTitle->innerHTML; + $content = $r->articleContent->innerHTML; + $parametres['title'] = $r->articleTitle->innerHTML; + $parametres['content'] = filtre_picture($content, $url, $id); + return $parametres; + } + } + + logm('error during url preparation'); + return FALSE; +} + +/** + * On modifie les URLS des images dans le corps de l'article + */ +function filtre_picture($content, $url, $id) +{ + $matches = array(); + preg_match_all('#<\s*(img)[^>]+src="([^"]*)"[^>]*>#Si', $content, $matches, PREG_SET_ORDER); + foreach($matches as $i => $link) + { + $link[1] = trim($link[1]); + if (!preg_match('#^(([a-z]+://)|(\#))#', $link[1]) ) + { + $absolute_path = get_absolute_link($link[2],$url); + $filename = basename(parse_url($absolute_path, PHP_URL_PATH)); + $directory = create_assets_directory($id); + $fullpath = $directory . '/' . $filename; + download_pictures($absolute_path, $fullpath); + $content = str_replace($matches[$i][2], $fullpath, $content); } + } - $parametres['title'] = $title; - $parametres['content'] = $r->articleContent->innerHTML; + return $content; +} + +/** + * Retourne le lien absolu + */ +function get_absolute_link($relative_link, $url) +{ + /* return if already absolute URL */ + if (parse_url($relative_link, PHP_URL_SCHEME) != '') return $relative_link; - return $parametres; + /* queries and anchors */ + if ($relative_link[0]=='#' || $relative_link[0]=='?') return $url . $relative_link; + + /* parse base URL and convert to local variables: + $scheme, $host, $path */ + extract(parse_url($url)); + + /* remove non-directory element from path */ + $path = preg_replace('#/[^/]*$#', '', $path); + + /* destroy path if relative url points to root */ + if ($relative_link[0] == '/') $path = ''; + + /* dirty absolute URL */ + $abs = $host . $path . '/' . $relative_link; + + /* replace '//' or '/./' or '/foo/../' with '/' */ + $re = array('#(/\.?/)#', '#/(?!\.\.)[^/]+/\.\./#'); + for($n=1; $n>0; $abs=preg_replace($re, '/', $abs, -1, $n)) {} + + /* absolute URL is ready! */ + return $scheme.'://'.$abs; +} + +/** + * Téléchargement des images + */ + +function download_pictures($absolute_path, $fullpath) +{ + $rawdata = get_external_file($absolute_path); + + if(file_exists($fullpath)) { + unlink($fullpath); + } + $fp = fopen($fullpath, 'x'); + fwrite($fp, $rawdata); + fclose($fp); +} + +/** + * Crée un répertoire de médias pour l'article + */ +function create_assets_directory($id) +{ + $assets_path = ABS_PATH; + if(!is_dir($assets_path)) { + mkdir($assets_path, 0705); + } + + $article_directory = $assets_path . $id; + if(!is_dir($article_directory)) { + mkdir($article_directory, 0705); + } + + return $article_directory; +} + +/** + * Suppression du répertoire d'images + */ +function remove_directory($directory) +{ + if(is_dir($directory)) { + $files = array_diff(scandir($directory), array('.','..')); + foreach ($files as $file) { + (is_dir("$directory/$file")) ? remove_directory("$directory/$file") : unlink("$directory/$file"); + } + return rmdir($directory); + } +} + +/** + * Appel d'une action (mark as fav, archive, delete) + */ + +function action_to_do($action, $id, $url, $token) +{ + global $db; + + switch ($action) + { + case 'add': + if ($url == '') + continue; + + $req = $db->getHandle()->query("SELECT id FROM entries ORDER BY id DESC"); + $id = $req->fetchColumn()+1; + + if($parametres_url = prepare_url($url, $id)) { + $sql_action = 'INSERT INTO entries ( id, url, title, content ) VALUES (?,?, ?, ?)'; + $params_action = array($id,$url, $parametres_url['title'], $parametres_url['content']); + } + + logm('add link ' . $url); + break; + case 'delete': + if (verif_token($token)) { + remove_directory(ABS_PATH . $id); + $sql_action = "DELETE FROM entries WHERE id=?"; + $params_action = array($id); + logm('delete link #' . $id); + } + else logm('csrf problem while deleting entry'); + break; + case 'toggle_fav' : + if (verif_token($token)) { + $sql_action = "UPDATE entries SET is_fav=~is_fav WHERE id=?"; + $params_action = array($id); + logm('mark as favorite link #' . $id); + } + else logm('csrf problem while fav entry'); + break; + case 'toggle_archive' : + if (verif_token($token)) { + $sql_action = "UPDATE entries SET is_read=~is_read WHERE id=?"; + $params_action = array($id); + logm('archive link #' . $id); + } + else logm('csrf problem while archive entry'); + break; + default: + break; + } + + try + { + # action query + if (isset($sql_action)) + { + $query = $db->getHandle()->prepare($sql_action); + $query->execute($params_action); + } + } + catch (Exception $e) + { + logm('action query error : '.$e->getMessage()); + } +} + +/** + * Détermine quels liens afficher : home, fav ou archives + */ +function display_view($view) +{ + global $db; + + switch ($_SESSION['sort']) + { + case 'ia': + $order = 'ORDER BY id'; + break; + case 'id': + $order = 'ORDER BY id DESC'; + break; + case 'ta': + $order = 'ORDER BY lower(title)'; + break; + case 'td': + $order = 'ORDER BY lower(title) DESC'; + break; + default: + $order = 'ORDER BY id'; + break; + } + + switch ($view) + { + case 'archive': + $sql = "SELECT * FROM entries WHERE is_read=? " . $order; + $params = array(-1); + break; + case 'fav' : + $sql = "SELECT * FROM entries WHERE is_fav=? " . $order; + $params = array(-1); + break; + default: + $sql = "SELECT * FROM entries WHERE is_read=? " . $order; + $params = array(0); + break; + } + + # view query + try + { + $query = $db->getHandle()->prepare($sql); + $query->execute($params); + $entries = $query->fetchAll(); + } + catch (Exception $e) + { + logm('view query error : '.$e->getMessage()); + } + + return $entries; +} + +/** + * Récupère un article en fonction d'un ID + */ +function get_article($id) +{ + global $db; + + $entry = NULL; + $sql = "SELECT * FROM entries WHERE id=?"; + $params = array(intval($id)); + + # view article query + try + { + $query = $db->getHandle()->prepare($sql); + $query->execute($params); + $entry = $query->fetchAll(); + } + catch (Exception $e) + { + logm('get article query error : '.$e->getMessage()); + } + + return $entry; +} + +/** + * Vérifie si le jeton passé en $_POST correspond à celui en session + */ +function verif_token($token) +{ + if(isset($_SESSION['token_poche']) && isset($_SESSION['token_time_poche']) && isset($token)) + { + if($_SESSION['token_poche'] == $token) + { + $old_timestamp = time() - (15*60); + if($_SESSION['token_time_poche'] >= $old_timestamp) + { + return TRUE; + } + else { + session_destroy(); + logm('session expired'); + } + } + else { + logm('token error : the token is different'); + return FALSE; + } + } + else { + logm('token error : the token is not here'); + return FALSE; + } +} + +function logm($message) +{ + $t = strval(date('Y/m/d_H:i:s')).' - '.$_SERVER["REMOTE_ADDR"].' - '.strval($message)."\n"; + file_put_contents('./log.txt',$t,FILE_APPEND); } \ No newline at end of file