Skip to content

Commit

Permalink
extractor modify
Browse files Browse the repository at this point in the history
  • Loading branch information
kaki-admin committed May 8, 2024
1 parent 6f47d12 commit eb9eb15
Show file tree
Hide file tree
Showing 3 changed files with 5 additions and 4 deletions.
3 changes: 2 additions & 1 deletion prerank-stages/extractor/main.go
Original file line number Diff line number Diff line change
Expand Up @@ -50,7 +50,8 @@ func main() {
if rank.RawContent == "" {
continue
}
- fullContent, pureContent, _, _, _, _, _, _ := processor.ArticleReadabilityExtractor(rank.RawContent, rank.Url, "", "", true)
+ //fullContent, pureContent, _, _, _, _, _, _ := processor.ArticleReadabilityExtractor(rank.RawContent, rank.Url, "", "", true)
+ fullContent, pureContent := processor.ArticleContentExtractor(rank.RawContent, rank.Url, "", "")
var contentLen int
if rank.Language != "zh-cn" {
contentArr := strings.Split(pureContent, " ")
Expand Down
2 changes: 1 addition & 1 deletion prerank-stages/go.mod
Original file line number Diff line number Diff line change
Expand Up @@ -3,7 +3,7 @@ module bytetrade.io/web3os/prerank_stages
go 1.20

require (
- github.com/beclab/article-extractor v0.0.2
+ github.com/beclab/article-extractor v0.0.5
github.com/redis/go-redis/v9 v9.5.1
go.mongodb.org/mongo-driver v1.15.0
go.uber.org/zap v1.27.0
Expand Down
4 changes: 2 additions & 2 deletions prerank-stages/go.sum
Original file line number Diff line number Diff line change
Expand Up @@ -2,8 +2,8 @@ github.com/PuerkitoBio/goquery v1.9.1 h1:mTL6XjbJTZdpfL+Gwl5U2h1l9yEkJjhmlTeV9VP
github.com/PuerkitoBio/goquery v1.9.1/go.mod h1:cW1n6TmIMDoORQU5IU/P1T3tGFunOeXEpGP2WHRwkbY=
github.com/andybalholm/cascadia v1.3.2 h1:3Xi6Dw5lHF15JtdcmAHD3i1+T8plmv7BQ/nsViSLyss=
github.com/andybalholm/cascadia v1.3.2/go.mod h1:7gtRlve5FxPPgIgX36uWBX58OdBsSS6lUvCFb+h7KvU=
- github.com/beclab/article-extractor v0.0.2 h1:LGPSv+qAvBtlT40bzLzQNTol6Cex5M4K5EbiZKh25iA=
- github.com/beclab/article-extractor v0.0.2/go.mod h1:ih8W3OrtbD586xkigBhfrKWD1GDFXEEbow3uVZ6U/bI=
+ github.com/beclab/article-extractor v0.0.5 h1:9CQIzS7Rj3qz03jvhXHbzv46PrbkUpgEnIPx40Xtpao=
+ github.com/beclab/article-extractor v0.0.5/go.mod h1:ih8W3OrtbD586xkigBhfrKWD1GDFXEEbow3uVZ6U/bI=
github.com/bsm/ginkgo/v2 v2.12.0 h1:Ny8MWAHyOepLGlLKYmXG4IEkioBysk6GpaRTLC8zwWs=
github.com/bsm/gomega v1.27.10 h1:yeMWxP2pV2fG3FgAODIY8EiRE3dy0aeFYt4l7wh6yKA=
github.com/cespare/xxhash/v2 v2.2.0 h1:DC2CZ1Ep5Y4k3ZQ899DldepgrayRUGE6BBZ/cd9Cj44=
Expand Down

0 comments on commit eb9eb15

Please sign in to comment.