代码拉取完成,页面将自动刷新
同步操作将从 Henson/Answer 强制同步,此操作会覆盖自 Fork 仓库以来所做的任何修改,且无法恢复!!!
确定后同步将在后台操作,完成时将刷新页面,请耐心等待。
package Answer
import (
"fmt"
"net/url"
"regexp"
"strings"
"sync"
"github.com/PuerkitoBio/goquery"
"github.com/axgle/mahonia"
"github.com/henson/Answer/util"
"github.com/ngaut/log"
"github.com/yanyiwu/gojieba"
)
//SearchResult 搜索总数跟频率
type SearchResult struct {
Sum int32
Freq int32
}
//GetSearchResult 返回各个搜索引擎返回的结果
func GetSearchResult(question string, answers []string) map[string][]*SearchResult {
if question == "" {
return nil
}
res := make(map[string][]*SearchResult)
res["百度"] = baiduSearch(question, answers)
return res
}
func baiduSearch(question string, answers []string) (result []*SearchResult) {
resultMap := make(map[string]*SearchResult, len(answers))
//搜索题目
searchURL := fmt.Sprintf("http://www.baidu.com/s?wd=%s", url.QueryEscape(question))
questionBody, err := util.HTTPGet(searchURL, 5)
if err != nil {
log.Errorf("search question:%s error", question)
return
}
var wg sync.WaitGroup
for k, answer := range answers {
answer = plainAnswer(answer)
answers[k] = answer
wg.Add(1)
go func(answer string) {
defer wg.Done()
searchResult := new(SearchResult)
//题目搜索结果中包含的答案的数量
searchResult.Freq = int32(strings.Count(string(questionBody), answer))
//题目+结果搜索的总数
keyword := fmt.Sprintf("%s %s", question, answer)
searchURL := fmt.Sprintf("http://www.baidu.com/s?wd=%s", url.QueryEscape(keyword))
body, err := util.HTTPGet(searchURL, 5)
if err != nil {
log.Errorf("search %s error", answer)
} else {
countRe, _ := regexp.Compile(`百度为您找到相关结果约([\d\,]+)`)
result := countRe.FindAllStringSubmatch(string(body), -1)
if len(result) > 0 {
sum := result[0][1]
sum = strings.Replace(sum, ",", "", -1)
searchResult.Sum = util.MustInt32(sum)
}
}
resultMap[answer] = searchResult
}(answer)
}
wg.Wait()
//将map转为slice 方便顺序输出
for _, answer := range answers {
result = append(result, resultMap[answer])
}
return result
}
//plainAnswer 去除答案中的 《》等字符
func plainAnswer(answer string) string {
answer = strings.TrimPrefix(answer, "《")
answer = strings.TrimSuffix(answer, "》")
return answer
}
func knowledge(question string) {
//中文分词,提取关键词
var keywords []string
words := gojieba.NewJieba().Tag(question)
for _, v := range words {
if strings.Contains(v, "/n") {
keywords = append(keywords, strings.Split(v, "/")[0])
}
}
//搜索题目
searchURL := fmt.Sprintf("https://zhidao.baidu.com/search?word=%s", url.QueryEscape(strings.Join(keywords, " ")))
doc, err := goquery.NewDocument(searchURL)
if err != nil {
log.Fatal(err)
}
s := doc.Find("#wgt-autoask")
t := s.Find("#wgt-autoask > dl > dt").Text()
d := s.Find("#wgt-autoask > dl > dd.dd.answer").Text()
dec := mahonia.NewDecoder("gbk")
t = dec.ConvertString(t)
d = dec.ConvertString(d)
d = strings.Replace(d, "\n", "", -1)
d = strings.Replace(d, "推荐答案", "", -1)
d = strings.Replace(d, "[详细]", "", -1)
fmt.Printf("知识图谱推荐答案:%s%s\n", t, d)
}
此处可能存在不合适展示的内容,页面不予展示。您可通过相关编辑功能自查并修改。
如您确认内容无涉及 不当用语 / 纯广告导流 / 暴力 / 低俗色情 / 侵权 / 盗版 / 虚假 / 无价值内容或违法国家有关法律法规的内容,可点击提交进行申诉,我们将尽快为您处理。