diff --git a/safaribook/spiders/safaribooks.py b/safaribook/spiders/safaribooks.py index 53ae048..d045d9d 100644 --- a/safaribook/spiders/safaribooks.py +++ b/safaribook/spiders/safaribooks.py @@ -92,7 +92,7 @@ def parse_page(self, title, bookid, path, response): def parse_toc(self, response): toc = eval(response.body) self.book_name = toc['title_safe'] - self.book_title = toc['title'].replace(' ','_').replace(':',' -') # to be used for filename + self.book_title = re.sub(r'["%*/:<>?\\|~\s]', r'_', toc['title']) # to be used for filename cover_path, = re.match(r'