Blame view

scripts/evaluation/tuning/coarse_rank_fusion_space.yaml 4.85 KB
dba57642   tangwang   bayes调参计划
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
  # NOTE(review): looks like the dotted config path of the section whose keys
  # are tuned by this file (the names under `baseline` / `parameters`) —
  # confirm against the tuning script that reads this file.
  target_path: coarse_rank.fusion
  
  # Reference value for each of the 14 fusion parameters. Every value here lies
  # inside the matching min/max range declared under `parameters`.
  # NOTE(review): presumably the currently deployed settings that tuned trials
  # are compared against — confirm.
  baseline:
    es_bias: 10.0
    es_exponent: 0.05
    text_bias: 0.1
    text_exponent: 0.35
    text_translation_weight: 1.0
    knn_text_weight: 1.0
    knn_image_weight: 2.0
    knn_tie_breaker: 0.3
    knn_bias: 0.2
    # Global knn exponent; several seed descriptions refer to this 5.6 value.
    knn_exponent: 5.6
    knn_text_bias: 0.2
    # The text/image sub-term exponents are 0.0 in the baseline; some seeds
    # (e.g. seed_component_exp) set them to non-zero values.
    knn_text_exponent: 0.0
    knn_image_bias: 0.2
    knn_image_exponent: 0.0
  
  # Search range for each tunable parameter. Each entry gives `min` and `max`
  # bounds, a sampling `scale` (log or linear) and `round` (4 for every entry).
  # NOTE(review): `round` is presumably the number of decimal places kept for
  # sampled values — confirm against the tuner.
  # As written, every log-scaled entry has min > 0, and every entry whose min
  # is 0.0 uses the linear scale; keep that invariant when editing bounds.
  parameters:
    es_bias: {min: 0.3, max: 80.0, scale: log, round: 4}
    es_exponent: {min: 0.0, max: 0.4, scale: linear, round: 4}
    text_bias: {min: 0.001, max: 4.0, scale: log, round: 4}
    text_exponent: {min: 0.02, max: 1.6, scale: linear, round: 4}
    text_translation_weight: {min: 0.1, max: 2.5, scale: linear, round: 4}
    knn_text_weight: {min: 0.1, max: 4.0, scale: linear, round: 4}
    knn_image_weight: {min: 0.1, max: 6.0, scale: linear, round: 4}
    knn_tie_breaker: {min: 0.0, max: 1.0, scale: linear, round: 4}
    knn_bias: {min: 0.001, max: 4.0, scale: log, round: 4}
    knn_exponent: {min: 0.05, max: 12.0, scale: log, round: 4}
    knn_text_bias: {min: 0.001, max: 4.0, scale: log, round: 4}
    knn_text_exponent: {min: 0.0, max: 6.0, scale: linear, round: 4}
    knn_image_bias: {min: 0.001, max: 4.0, scale: log, round: 4}
    knn_image_exponent: {min: 0.0, max: 6.0, scale: linear, round: 4}
  
  # Twelve named seed configurations. Each seed lists only a subset of the
  # parameters, and every listed value lies inside its `parameters` range.
  # NOTE(review): parameters a seed omits presumably fall back to `baseline` —
  # confirm against the tuner.
  # The comment above each seed is an English rendering of its `description`.
  seed_experiments:
    # Lower the global knn exponent to first check whether the current 5.6 is
    # too aggressive.
    - name: seed_knn_soften
      description: 压低 knn 全局指数,先验证当前 5.6 是否过猛
      params:
        text_exponent: 0.42
        knn_image_weight: 1.2
        knn_bias: 0.35
        knn_exponent: 1.4
    # Improve lexical stability; keep translation and image knn from
    # over-dominating.
    - name: seed_text_guard
      description: 提升 lexical 稳定性,抑制翻译与 image knn 过度主导
      params:
        text_exponent: 0.62
        text_translation_weight: 0.75
        knn_image_weight: 1.0
        knn_tie_breaker: 0.15
        knn_exponent: 2.2
    # Let both text and image knn contribute, but reduce the image bias and the
    # overall exponent.
    - name: seed_semantic_balanced
      description: 让 text/image knn 都参与,但降低 image 偏置和总指数
      params:
        text_exponent: 0.32
        knn_text_weight: 1.4
        knn_image_weight: 1.8
        knn_tie_breaker: 0.45
        knn_bias: 0.18
        knn_exponent: 3.0
    # Turn on the knn_text/image sub-term exponents to see whether the global
    # knn_exponent can be pushed down into the sub-terms.
    - name: seed_component_exp
      description: 打开 knn_text/image 子项指数,观察全局 knn_exponent 是否可下放
      params:
        knn_bias: 0.15
        knn_exponent: 1.6
        knn_text_exponent: 0.8
        knn_image_exponent: 0.4
    # Increase the discriminative power of the es factor; check whether coarse
    # ranking flattens lexical scores too much.
    - name: seed_es_relax
      description: 增强 es 因子的区分度,验证 coarse 是否过分压平 lexical 分数
      params:
        es_bias: 3.0
        es_exponent: 0.11
        text_exponent: 0.48
        knn_exponent: 2.6
    # Deliberately amplify image knn as a contrast run to see which queries are
    # clearly hurt.
    - name: seed_image_heavy
      description: 刻意放大 image knn 做对照,看哪些 query 会明显受损
      params:
        text_exponent: 0.22
        knn_text_weight: 0.9
        knn_image_weight: 3.4
        knn_tie_breaker: 0.55
        knn_bias: 0.12
        knn_exponent: 3.8
    # Keep probing upward from the baseline toward a stronger global knn
    # exponent, to check whether 5.6 is still conservative.
    - name: seed_high_knn_global
      description: 沿着 baseline 继续上探更强 knn 全局指数,验证 5.6 是否仍偏保守
      params:
        text_exponent: 0.28
        knn_text_weight: 1.1
        knn_image_weight: 2.6
        knn_tie_breaker: 0.4
        knn_bias: 0.12
        knn_exponent: 7.2
    # Raise text knn, lower image knn, and enable the text/image sub-term
    # exponents at the same time.
    - name: seed_text_knn_split
      description: 提高 text knn,压低 image knn,同时打开 text/image 子项指数
      params:
        text_exponent: 0.38
        knn_text_weight: 2.0
        knn_image_weight: 0.8
        knn_tie_breaker: 0.2
        knn_bias: 0.08
        knn_exponent: 4.8
        knn_text_exponent: 1.1
        knn_image_exponent: 0.15
    # Keep a fairly high image weight, but move the non-linearity into the
    # image sub-term instead of the global knn term.
    - name: seed_image_split
      description: 保持较高 image 权重,但把非线性拆到 image 子项而不是全局 knn
      params:
        text_exponent: 0.26
        knn_text_weight: 0.9
        knn_image_weight: 3.0
        knn_tie_breaker: 0.35
        knn_bias: 0.08
        knn_exponent: 3.4
        knn_text_exponent: 0.2
        knn_image_exponent: 1.0
    # Increase es and lexical discrimination; test whether coarse ranking needs
    # stronger text-ranking stability.
    - name: seed_es_text_sharpen
      description: 提升 es 与 lexical 区分度,测试 coarse 是否需要更强文本排序稳定性
      params:
        es_bias: 2.0
        es_exponent: 0.16
        text_bias: 0.03
        text_exponent: 0.78
        text_translation_weight: 0.9
        knn_bias: 0.1
        knn_exponent: 5.0
    # Substantially weaken translation hits; check whether abstract queries
    # rely too heavily on the translation path.
    - name: seed_translation_discount
      description: 明显削弱 translation 命中,验证抽象 query 是否过度依赖翻译通路
      params:
        text_exponent: 0.44
        text_translation_weight: 0.45
        knn_text_weight: 1.2
        knn_image_weight: 1.7
        knn_tie_breaker: 0.25
        knn_exponent: 5.4
    # Small perturbations close to the baseline; prioritise finding achievable
    # gains rather than only testing extreme directions.
    - name: seed_near_baseline_jitter
      description: 贴近 baseline 做小扰动,优先寻找可行增益而不是只测极端方向
      params:
        es_bias: 8.0
        es_exponent: 0.06
        text_bias: 0.06
        text_exponent: 0.31
        text_translation_weight: 1.1
        knn_text_weight: 1.1
        knn_image_weight: 2.2
        knn_tie_breaker: 0.34
        knn_bias: 0.16
        knn_exponent: 5.9
  
  # Settings for the search procedure itself. This file only supplies the
  # values; the per-key notes below are inferred from the key names alone.
  # NOTE(review): confirm each one against the tuner implementation.
  optimizer:
    # presumably the number of purely random trials run before guided search
    init_random: 8
    # presumably how many candidate points are generated per proposal step
    candidate_pool_size: 512
    # presumably the chance (0-1) that a proposal is an exploratory sample
    explore_probability: 0.28
    # presumably the chance (0-1) that a proposal perturbs a known good point
    local_jitter_probability: 0.42
    # presumably the share (0-1) of best trials treated as the elite set
    elite_fraction: 0.35
    # presumably the minimum distance, in normalized parameter space, required
    # between a new candidate and already-evaluated points
    min_normalized_distance: 0.12