We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent e567698, commit 2a6f33c (Copy full SHA for 2a6f33c)
1 file changed
playwright_news_crawler/daum_news_parser.py
@@ -8,6 +8,7 @@
8
from datetime import datetime, timezone, timedelta
9
from bs4 import BeautifulSoup
10
import logging
11
+import boto3
12
13
class DaumNewsParser:
14
def __init__(self):
@@ -28,6 +29,8 @@ def __init__(self):
28
29
"Referer": "https://news.daum.net/",
30
}
31
32
+ self.s3_client = boto3.client("s3")
33
+
34
self.NAME_MATCH_RE = re.compile(r"^[가-힣]{2,3}$")
35
self.EMAIL_END_RE = re.compile(r"\(?[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}\)?$")
36
self.CLEAN_WS = re.compile(r"\s+")
0 commit comments