-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathgetPttPostDemo.R
34 lines (22 loc) · 979 Bytes
/
getPttPostDemo.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# Demo: scraping PTT posts with the RPTT package.
#
# Meant to be stepped through at an interactive console: bare expressions
# such as `listPageUrls` only auto-print there. Every step talks to the
# network through RPTT.

# One-time installation of RPTT from GitHub:
# library(devtools)
# install_github("agilearning/RPTT")
library(RPTT)

# Step 1: list-page URLs of the "Gossiping" board; keep the first five.
listPageUrls <- getListPageUrls("Gossiping")[1:5]
listPageUrls

# Step 2: gather the post URLs of every list page into one flat vector.
postUrls <- unlist(lapply(listPageUrls, getPostUrls))
postUrls

# Step 3: fetch single posts, first by literal URL, then by index.
getPostData("https://www.ptt.cc/bbs/Gossiping/M.1431338763.A.1BF.html")
getPostData(postUrls[2])

# Step 4: fetch a few posts and bind the `postData` / `pushDf` elements of
# each result row-wise.
postData <- lapply(postUrls[3:5], getPostData)
postDf <- data.frame(
  do.call(rbind, lapply(postData, function(xx) xx$postData))
)
pushDf <- do.call(rbind, lapply(postData, function(xx) xx$pushDf))

# Step 5: fetch every post.
# Unguarded variant, kept for reference only: one failing URL would abort the
# whole lapply(), and its result is replaced by the guarded call right below.
# postData <- lapply(postUrls, getPostData)
postData <- lapply(
  postUrls,
  function(url) try(getPostData(url), silent = TRUE)
)

# try() hands back an object of class "try-error" on failure. inherits()
# stays correct even if a successful result carries several classes, and
# vapply() guarantees a logical vector (also for zero URLs).
is_error <- vapply(postData, inherits, logical(1), what = "try-error")

# Inspect the outcome: leading class of each result, then the success mask.
vapply(postData, function(x) class(x)[1L], character(1))
!is_error

error_idx <- which(is_error)
data_idx <- which(!is_error)

# Keep only the successfully fetched posts and build the final data frame.
data <- postData[data_idx]
postDf <- data.frame(do.call(rbind, lapply(data, function(xx) xx$postData)))

# View() needs a data viewer, so only call it from an interactive session.
if (interactive()) {
  View(postDf)
}
postDf$Title