diff --git a/README.md b/README.md index 46c5934..20f0641 100644 --- a/README.md +++ b/README.md @@ -11,5 +11,5 @@ Fetch depth: 1 There files need to be modified while add a new site: - main.go: add entrance url - links.go -> SetLinks(): add case about target urls feature regex, eg: if url must have `about`, param 2 is `.*?about.*` -- post.go -> TreatPost(): add case for new site domain. - site/newsite: copy files from sibling folder, then develop and pass the test. +- post.go -> TreatPost(): add case for new site domain. diff --git a/internal/fetcher/fetcher_test.go b/internal/fetcher/fetcher_test.go index 1f18ce5..1c3b47b 100644 --- a/internal/fetcher/fetcher_test.go +++ b/internal/fetcher/fetcher_test.go @@ -15,7 +15,8 @@ func TestCrawl(t *testing.T) { // "https://www.zaobao.com/news/world", // "https://www.voachinese.com", // "https://www.rfa.org/mandarin/", - "https://news.ltn.com.tw/list/breakingnews", + // "https://news.ltn.com.tw/list/breakingnews", + "https://www.cna.com.tw/list/aall.aspx", }) log.Println("Sleep a sec ...") diff --git a/internal/fetcher/sites/cna/cna.go b/internal/fetcher/sites/cna/cna.go index 45ece75..8e7d5a9 100644 --- a/internal/fetcher/sites/cna/cna.go +++ b/internal/fetcher/sites/cna/cna.go @@ -56,7 +56,7 @@ func setDate(p *Post) error { } tY := cs[0][:4] tM := cs[0][5:7] - tD := cs[0][7:9] + tD := cs[0][8:10] tH := cs[0][11:13] tm := cs[0][14:16] yy, err := strconv.Atoi(tY) diff --git a/internal/fetcher/sites/cna/cna_test.go b/internal/fetcher/sites/cna/cna_test.go index 6720c58..85b6128 100644 --- a/internal/fetcher/sites/cna/cna_test.go +++ b/internal/fetcher/sites/cna/cna_test.go @@ -32,7 +32,7 @@ func TestSetDate(t *testing.T) { if err := setDate(p); err != nil { t.Errorf("test SetPost err: %v", doc) } - want := "2020-08-31T11:49:00+08:00" + want := "2020-09-29T11:49:00+08:00" if p.Date != want { t.Errorf("\ngot: %v\nwant: %v", p.Date, want) }