Thanks for visiting codestin.com
Credit goes to github.com

Skip to content

Commit 66b8ce3

Browse files
committed
配置化
1 parent 98c3c6a commit 66b8ce3

File tree

5 files changed

+10
-4
lines changed

5 files changed

+10
-4
lines changed

config/db.sql

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -290,6 +290,7 @@ CREATE TABLE IF NOT EXISTS `crawl_rule` (
290290
`author` varchar(127) NOT NULL DEFAULT '' COMMENT '文章作者规则',
291291
`pub_date` varchar(127) NOT NULL DEFAULT '' COMMENT '发布时间规则',
292292
`content` varchar(127) NOT NULL DEFAULT '' COMMENT '正文规则',
293+
`ext` varchar(1022) NOT NULL DEFAULT '' COMMENT '扩展,比如附加 css 等,json格式',
293294
`op_user` varchar(20) NOT NULL DEFAULT '' COMMENT '操作人',
294295
`ctime` timestamp NOT NULL DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
295296
PRIMARY KEY (`id`),

config/env.sample.ini

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -58,6 +58,9 @@ spec = 0 0 */1 * * ?
5858
iframe_deny = github.com,robbinfan.com,www.zhihu.com,google.com,golang.org,evernote.com,blogspot.com
5959
reddit_path = /r/golang/new/
6060
project_url = http://www.oschina.net/project/lang/358/go?tag=0&os=0&sort=time
61+
article_title_pattern = (?i)go|golang|goroutine|channel
62+
preset_users = polaris
63+
preset_uids = 1
6164

6265
[search]
6366
engine_url = http://127.0.0.1:7070/solr/studygolang

src/http/controller/admin/project.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -76,7 +76,7 @@ func (ProjectController) CrawlProject(ctx echo.Context) error {
7676

7777
var errMsg string
7878
for _, projectUrl := range urls {
79-
err := logic.DefaultProject.ParseProjectList(strings.TrimSpace(projectUrl))
79+
err := logic.DefaultProject.ParseOneProject(strings.TrimSpace(projectUrl))
8080
if err != nil {
8181
errMsg = err.Error()
8282
}

src/logic/project.go

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@ import (
2020

2121
"github.com/PuerkitoBio/goquery"
2222
"github.com/lunny/html2md"
23+
"github.com/polaris1119/config"
2324
"github.com/polaris1119/logger"
2425
"golang.org/x/net/context"
2526
)
@@ -264,7 +265,7 @@ const OsChinaDomain = "http://www.oschina.net"
264265
// ProjectLogoPrefix 开源项目 logo 前缀
265266
const ProjectLogoPrefix = "plogo"
266267

267-
var PresetUsernames = []string{"polaris", "blov", "agolangf", "xuanbao"}
268+
var PresetUsernames = config.ConfigFile.MustValueArray("crawl", "preset_users", ",")
268269

269270
// ParseOneProject 处理单个 project
270271
func (ProjectLogic) ParseOneProject(projectUrl string) error {

src/logic/reddit.go

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ import (
2121

2222
"github.com/PuerkitoBio/goquery"
2323
"github.com/polaris1119/config"
24+
"github.com/polaris1119/goutils"
2425
"github.com/polaris1119/logger"
2526
)
2627

@@ -85,7 +86,7 @@ func (this *RedditLogic) newDocumentFromResp(url string) (*goquery.Document, err
8586
return goquery.NewDocumentFromResponse(resp)
8687
}
8788

88-
var PresetUids = []int{1, 1747, 1748, 1827}
89+
var PresetUids = config.ConfigFile.MustValueArray("crawl", "preset_uids", ",")
8990

9091
var resourceRe = regexp.MustCompile(`\n\n`)
9192

@@ -177,7 +178,7 @@ func (this *RedditLogic) dealRedditOneResource(contentSelection *goquery.Selecti
177178

178179
resource.Title = title
179180
resource.Url = resourceUrl
180-
resource.Uid = PresetUids[rand.Intn(4)]
181+
resource.Uid = goutils.MustInt(PresetUids[rand.Intn(len(PresetUids))])
181182

182183
ctime := time.Now()
183184
datetime, ok := contentSelection.Find(".tagline time").Attr("datetime")

0 commit comments

Comments
 (0)