new_search (#238)

Co-authored-by: Buf Generate <buf-generate@bondee.com>
This commit is contained in:
Carlo
2025-10-16 21:15:13 +08:00
committed by GitHub
parent c485f1cd49
commit d5138d32bc
8 changed files with 292 additions and 18 deletions

View File

@@ -16,6 +16,131 @@ type SearchResult struct {
} `json:"search"`
}
type FilterOption struct {
FiltersIndex int `json:"filters_index" jsonschema:"筛选组索引 1=排序依据, 2=笔记类型, 3=发布时间, 4=搜索范围, 5=位置距离"`
TagsIndex int `json:"tags_index" jsonschema:"标签索引,根据不同的筛选组索引对应不同的选项: 1=排序依据(1-5), 2=笔记类型(1-3), 3=发布时间(1-4), 4=搜索范围(1-4), 5=位置距离(1-3)"`
Text string `json:"text" jsonschema:"标签文本描述"`
}
// 预定义的筛选选项映射表
var FilterOptionsMap = map[int][]FilterOption{
1: { // 排序依据
{FiltersIndex: 1, TagsIndex: 1, Text: "综合"},
{FiltersIndex: 1, TagsIndex: 2, Text: "最新"},
{FiltersIndex: 1, TagsIndex: 3, Text: "最多点赞"},
{FiltersIndex: 1, TagsIndex: 4, Text: "最多评论"},
{FiltersIndex: 1, TagsIndex: 5, Text: "最多收藏"},
},
2: { // 笔记类型
{FiltersIndex: 2, TagsIndex: 1, Text: "不限"},
{FiltersIndex: 2, TagsIndex: 2, Text: "视频"},
{FiltersIndex: 2, TagsIndex: 3, Text: "图文"},
},
3: { // 发布时间
{FiltersIndex: 3, TagsIndex: 1, Text: "不限"},
{FiltersIndex: 3, TagsIndex: 2, Text: "一天内"},
{FiltersIndex: 3, TagsIndex: 3, Text: "一周内"},
{FiltersIndex: 3, TagsIndex: 4, Text: "半年内"},
},
4: { // 搜索范围
{FiltersIndex: 4, TagsIndex: 1, Text: "不限"},
{FiltersIndex: 4, TagsIndex: 2, Text: "已看过"},
{FiltersIndex: 4, TagsIndex: 3, Text: "未看过"},
{FiltersIndex: 4, TagsIndex: 4, Text: "已关注"},
},
5: { // 位置距离
{FiltersIndex: 5, TagsIndex: 1, Text: "不限"},
{FiltersIndex: 5, TagsIndex: 2, Text: "同城"},
{FiltersIndex: 5, TagsIndex: 3, Text: "附近"},
},
}
// 定义筛选组索引到中文描述的映射
var filterGroupMap = map[int]string{
1: "排序依据",
2: "笔记类型",
3: "发布时间",
4: "搜索范围",
5: "位置距离",
}
// validateFilterOption 验证筛选选项是否在有效范围内
func validateFilterOption(filter FilterOption) error {
// 检查筛选组索引是否有效
if filter.FiltersIndex < 1 || filter.FiltersIndex > 5 {
return fmt.Errorf("无效的筛选组索引 %d有效范围为 1-5", filter.FiltersIndex)
}
// 检查标签索引是否在对应筛选组的有效范围内
options, exists := FilterOptionsMap[filter.FiltersIndex]
if !exists {
return fmt.Errorf("筛选组 %d 不存在", filter.FiltersIndex)
}
if filter.TagsIndex < 1 || filter.TagsIndex > len(options) {
return fmt.Errorf("筛选组 %d 的标签索引 %d 超出范围,有效范围为 1-%d",
filter.FiltersIndex, filter.TagsIndex, len(options))
}
return nil
}
// 便利函数:根据文本创建筛选选项
func NewFilterOption(filtersIndex int, text string) (FilterOption, error) {
options, exists := FilterOptionsMap[filtersIndex]
if !exists {
return FilterOption{}, fmt.Errorf("筛选组 %d 不存在", filtersIndex)
}
for _, option := range options {
if option.Text == text {
return option, nil
}
}
return FilterOption{}, fmt.Errorf("在筛选组 %d 中未找到文本 '%s'", filtersIndex, text)
}
// 便利函数:创建常用的筛选选项
func SortBy(text string) (FilterOption, error) {
return NewFilterOption(1, text) // 排序依据
}
func NoteType(text string) (FilterOption, error) {
return NewFilterOption(2, text) // 笔记类型
}
func TimeRange(text string) (FilterOption, error) {
return NewFilterOption(3, text) // 发布时间
}
func SearchScope(text string) (FilterOption, error) {
return NewFilterOption(4, text) // 搜索范围
}
func LocationDistance(text string) (FilterOption, error) {
return NewFilterOption(5, text) // 位置距离
}
// GetFilterGroupDescription 根据筛选组索引获取中文描述
func GetFilterGroupDescription(index int) string {
if desc, exists := filterGroupMap[index]; exists {
return desc
}
return "未知筛选组"
}
// GetFilterGroupIndex 根据中文描述获取筛选组索引
func GetFilterGroupIndex(text string) int {
// 通过遍历filterGroupMap获取对应的索引
for index, description := range filterGroupMap {
if description == text {
return index
}
}
return -1 // 未找到匹配项时返回-1
}
type SearchAction struct {
page *rod.Page
}
@@ -26,7 +151,7 @@ func NewSearchAction(page *rod.Page) *SearchAction {
return &SearchAction{page: pp}
}
func (s *SearchAction) Search(ctx context.Context, keyword string) ([]Feed, error) {
func (s *SearchAction) Search(ctx context.Context, keyword string, filters ...FilterOption) ([]Feed, error) {
page := s.page.Context(ctx)
searchURL := makeSearchURL(keyword)
@@ -35,6 +160,36 @@ func (s *SearchAction) Search(ctx context.Context, keyword string) ([]Feed, erro
page.MustWait(`() => window.__INITIAL_STATE__ !== undefined`)
// 如果有筛选条件,则应用筛选
if len(filters) > 0 {
// 验证所有筛选选项
for _, filter := range filters {
if err := validateFilterOption(filter); err != nil {
return nil, fmt.Errorf("筛选选项验证失败: %w", err)
}
}
// 悬停在筛选按钮上
filterButton := page.MustElement(`div.filter`)
filterButton.MustHover()
// 等待筛选面板出现
page.MustWait(`() => document.querySelector('div.filter-panel') !== null`)
// 应用所有筛选条件
for _, filter := range filters {
selector := fmt.Sprintf(`div.filter-panel div.filters:nth-child(%d) div.tags:nth-child(%d)`,
filter.FiltersIndex, filter.TagsIndex)
option := page.MustElement(selector)
option.MustClick()
}
// 等待页面更新
page.MustWaitStable()
// 重新等待 __INITIAL_STATE__ 更新
page.MustWait(`() => window.__INITIAL_STATE__ !== undefined`)
}
// 获取 window.__INITIAL_STATE__ 并转换为 JSON 字符串
result := page.MustEval(`() => {
if (window.__INITIAL_STATE__) {
@@ -61,5 +216,7 @@ func makeSearchURL(keyword string) string {
values.Set("keyword", keyword)
values.Set("source", "web_explore_feed")
//https://www.xiaohongshu.com/search_result?keyword=%25E7%258E%258B%25E5%25AD%2590&source=web_search_result_notes
//https://www.xiaohongshu.com/search_result?keyword=%25E7%258E%258B%25E5%25AD%2590&source=web_explore_feed
return fmt.Sprintf("https://www.xiaohongshu.com/search_result?%s", values.Encode())
}