summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author Benjamin Brahmer <info@b-brahmer.de> 2023-01-10 12:28:10 +0100
committer Benjamin Brahmer <info@b-brahmer.de> 2023-01-11 10:19:34 +0100
commit 0dfd93f75df2997568907474ab9d4d2a89e53dd5 (patch)
tree f86175297f03b1db39fcb89dcd25963ee910ab43
parent 343aa5e2f79b5cfe4b4d780d4ce4573da03045cd (diff)
Workaround for #2048
The league/uri version that we inherit in Nextcloud is a bit outdated. That version can't handle certain URIs.

Signed-off-by: Benjamin Brahmer <info@b-brahmer.de>
-rw-r--r-- CHANGELOG.md 1
-rw-r--r-- lib/Scraper/Scraper.php 7
2 files changed, 7 insertions, 1 deletions
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 4ff2d1c05..061ad1475 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -7,6 +7,7 @@ The format is mostly based on [Keep a Changelog](https://keepachangelog.com/en/1
### Changed
### Fixed
+- SyntaxError triggered when full-text is enabled with some items. (#2048, #2053)
# Releases
## [20.0.0] - 2022-12-14
diff --git a/lib/Scraper/Scraper.php b/lib/Scraper/Scraper.php
index 5deac358e..998c4464c 100644
--- a/lib/Scraper/Scraper.php
+++ b/lib/Scraper/Scraper.php
@@ -14,6 +14,7 @@ namespace OCA\News\Scraper;
use fivefilters\Readability\Readability;
use fivefilters\Readability\Configuration;
use fivefilters\Readability\ParseException;
+use League\Uri\Exceptions\SyntaxError;
use Psr\Log\LoggerInterface;
class Scraper implements IScraper
@@ -74,10 +75,14 @@ class Scraper implements IScraper
try {
$this->readability->parse($content);
- } catch (ParseException $e) {
+ } catch (ParseException | SyntaxError $e) {
$this->logger->error('Unable to parse content from {url}', [
'url' => $url,
]);
+ $this->logger->debug('Error during parsing of {url} ran into {error}', [
+ 'url' => $url,
+ 'error' => $e,
+ ]);
}
return true;
}