Skip to content

Commit

Permalink
bug fix
Browse files Browse the repository at this point in the history
  • Loading branch information
Jinnrry committed Aug 3, 2019
1 parent b51e710 commit ddfb549
Show file tree
Hide file tree
Showing 2 changed files with 38 additions and 23 deletions.
7 changes: 7 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,13 @@

[![Home](https://img.shields.io/badge/link-项目主页-brightgreen.svg)](https://jiangwei1995910.github.io/getAwayBSG/)
[![Link](https://img.shields.io/badge/link-python实现-blue.svg)](https://github.com/jiangwei1995910/getAwayBSG/tree/python)
[![Downloads](https://img.shields.io/github/downloads/jiangwei1995910/getAwayBSG/total)](https://img.shields.io/github/downloads/jiangwei1995910/getAwayBSG/total)
[![forks](https://img.shields.io/github/forks/jiangwei1995910/getAwayBSG?style=flat)](https://img.shields.io/github/forks/jiangwei1995910/getAwayBSG?style=flat)
[![stars](https://img.shields.io/github/stars/jiangwei1995910/getAwayBSG)](https://img.shields.io/github/stars/jiangwei1995910/getAwayBSG)
[![license](https://img.shields.io/github/license/jiangwei1995910/getAwayBSG)](https://img.shields.io/github/license/jiangwei1995910/getAwayBSG)
[![issues](https://img.shields.io/github/issues/jiangwei1995910/getAwayBSG)](https://img.shields.io/github/issues/jiangwei1995910/getAwayBSG)
[![version](https://img.shields.io/github/release/jiangwei1995910/getAwayBSG)](https://img.shields.io/github/release/jiangwei1995910/getAwayBSG)



> **注意!**\
Expand Down
54 changes: 31 additions & 23 deletions entrance/lianjia_zufang.go
Original file line number Diff line number Diff line change
Expand Up @@ -150,36 +150,44 @@ func TcrawlerOneCityZuFang(cityUrl string, cityname string) {
goUrl := re.ReplaceAllString(element.Request.URL.String(), "")

err = c.Visit(goUrl + "pg" + strconv.Itoa(i) + "/")
if err.Error() != "URL already visited" {
if err != nil && err.Error() != "URL already visited" {
fmt.Println(err)
}

}
}
})

c.OnHTML(".filter a", func(element *colly.HTMLElement) {
//// 切换地点
u, err := url.Parse(cityUrl)
if err != nil {
panic(err)
}
rootUrl := u.Scheme + "://" + u.Host
goUrl := element.Attr("href")
u, err = url.Parse(goUrl)
if err != nil && err.Error() != "URL already visited" {
fmt.Println(err)
}
if u.Scheme == "" {
goUrl = rootUrl + u.Path
} else {
goUrl = u.String()
}
re, _ := regexp.Compile("pg\\d+/*")
goUrl = re.ReplaceAllString(goUrl, "")
err = c.Visit(goUrl)
if err != nil && err.Error() != "URL already visited" {
fmt.Println(err)
c.OnHTML(".filter ul", func(element *colly.HTMLElement) {

data_target := element.Attr("data-target")

if data_target == "area" {
element.ForEach("a", func(i int, element *colly.HTMLElement) {
//// 切换地点
u, err := url.Parse(cityUrl)
if err != nil {
panic(err)
}
rootUrl := u.Scheme + "://" + u.Host
goUrl := element.Attr("href")
u, err = url.Parse(goUrl)
if err != nil && err.Error() != "URL already visited" {
fmt.Println(err)
}
if u.Scheme == "" {
goUrl = rootUrl + u.Path
} else {
goUrl = u.String()
}
re, _ := regexp.Compile("pg\\d+/*")
goUrl = re.ReplaceAllString(goUrl, "")
err = c.Visit(goUrl)
if err != nil && err.Error() != "URL already visited" {
fmt.Println(err)
}

})
}

})
Expand Down

0 comments on commit ddfb549

Please sign in to comment.