Thanks for visiting codestin.com. Credit goes to github.com.
We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d2ec132 commit 9a08f7f (Copy full SHA for 9a08f7f)
1 file changed
lib/core/common.py
@@ -1128,7 +1128,9 @@ def preparePageForLineComparison(page):
1128
def getFilteredPageContent(page):
1129
retVal = page
1130
if isinstance(page, basestring):
1131
- retVal = re.sub(r"(?s)<script.+?</script>|<style.+?</style>|<[^>]+>|\t|\n|\r", "", page)
+ retVal = re.sub(r"(?s)<script.+?</script>|<style.+?</style>|<[^>]+>|\t|\n|\r", " ", page)
1132
+ while retVal.find("  ") != -1:
1133
+ retVal = retVal.replace("  ", " ")
1134
return retVal
1135
1136
def getPageTextWordsSet(page):
0 commit comments