diff --git a/lib/core/common.py b/lib/core/common.py index 972ed3d1b..e63700264 100644 --- a/lib/core/common.py +++ b/lib/core/common.py @@ -1589,7 +1589,7 @@ def getFilteredPageContent(page, onlyText=True): return retVal def getPageWordSet(page): - retVal = None + retVal = set() # only if the page's charset has been successfully identified if isinstance(page, unicode):