mirror of
https://git.tt-rss.org/git/tt-rss.git
synced 2025-12-13 11:45:56 +00:00
move readability library to af_readability/vendor out of global vendor directory
af_redditimgur: use HOOK_GET_FULL_TEXT instead of invoking readability directly
This commit is contained in:
@@ -1,7 +1,4 @@
|
|||||||
<?php
|
<?php
|
||||||
use andreskrey\Readability\Readability;
|
|
||||||
use andreskrey\Readability\Configuration;
|
|
||||||
|
|
||||||
class Af_RedditImgur extends Plugin {
|
class Af_RedditImgur extends Plugin {
|
||||||
|
|
||||||
/* @var PluginHost $host */
|
/* @var PluginHost $host */
|
||||||
@@ -551,47 +548,16 @@ class Af_RedditImgur extends Plugin {
|
|||||||
parse it which p much requires curl */
|
parse it which p much requires curl */
|
||||||
|
|
||||||
$useragent_compat = "Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; WOW64; Trident/6.0)";
|
$useragent_compat = "Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.1; WOW64; Trident/6.0)";
|
||||||
|
|
||||||
$content_type = $this->get_content_type($url, $useragent_compat);
|
$content_type = $this->get_content_type($url, $useragent_compat);
|
||||||
|
|
||||||
if ($content_type && strpos($content_type, "text/html") !== FALSE) {
|
if ($content_type && strpos($content_type, "text/html") !== FALSE) {
|
||||||
|
|
||||||
$tmp = fetch_file_contents(["url" => $url,
|
foreach ($this->host->get_hooks(PluginHost::HOOK_GET_FULL_TEXT) as $p) {
|
||||||
"useragent" => $useragent_compat,
|
$extracted_content = $p->hook_get_full_text($url);
|
||||||
"http_accept" => "text/html"]);
|
|
||||||
|
|
||||||
Debug::log("tmplen: " . mb_strlen($tmp), Debug::$LOG_VERBOSE);
|
if ($extracted_content) {
|
||||||
|
$article["content"] = $extracted_content;
|
||||||
if ($tmp && mb_strlen($tmp) < 1024 * 500) {
|
break;
|
||||||
|
|
||||||
$r = new Readability(new Configuration());
|
|
||||||
|
|
||||||
try {
|
|
||||||
if ($r->parse($tmp)) {
|
|
||||||
|
|
||||||
$tmpxpath = new DOMXPath($r->getDOMDocument());
|
|
||||||
|
|
||||||
$entries = $tmpxpath->query('(//a[@href]|//img[@src])');
|
|
||||||
|
|
||||||
foreach ($entries as $entry) {
|
|
||||||
if ($entry->hasAttribute("href")) {
|
|
||||||
$entry->setAttribute("href",
|
|
||||||
rewrite_relative_url($url, $entry->getAttribute("href")));
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
if ($entry->hasAttribute("src")) {
|
|
||||||
$entry->setAttribute("src",
|
|
||||||
rewrite_relative_url($url, $entry->getAttribute("src")));
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
}
|
|
||||||
|
|
||||||
$article["content"] = $r->getContent() . "<hr/>" . $article["content"];
|
|
||||||
}
|
|
||||||
} catch (Exception $e) {
|
|
||||||
//
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user