From 09b4040578f5aec9a203dda2caeab0ab0f1fc152 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mi=C5=A1o=20Belica?= Date: Thu, 28 Nov 2013 11:50:48 +0100 Subject: [PATCH] Append sibling node only when it doesn't already exist --- CHANGELOG.rst | 1 + readability/readable.py | 3 ++- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.rst b/CHANGELOG.rst index 36ecf26..298ae4e 100644 --- a/CHANGELOG.rst +++ b/CHANGELOG.rst @@ -2,6 +2,7 @@ Changelog for readability ========================== +- Sibling node is appended only when sibling doesn't already exist. - Treat images a little differently so they get more inclusion. - Added User-Agent string into HTTP requests. - Added property ``Article.main_text`` for getting text annotated with diff --git a/readability/readable.py b/readability/readable.py index e8f6bdd..ad5c02f 100644 --- a/readability/readable.py +++ b/readability/readable.py @@ -154,7 +154,8 @@ def check_siblings(candidate_node, candidate_list): # filtered out later by accident. sibling.tag = "div" - candidate_node.node.append(sibling) + if candidate_node.node != sibling: + candidate_node.node.append(sibling) return candidate_node