Blame view

scripts/evaluation/eval_framework/__init__.py 1.47 KB
c81b0fc1   tangwang   scripts/evaluatio...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
  """
  Search evaluation framework: pooled relevance annotation, live metrics, batch reports.
  
  Importing this package ensures the project root is on ``sys.path`` (for ``api.*`` imports).
  """
  
  from __future__ import annotations
  
  from .utils import ensure_project_on_path
  
  # Deliberate import-time side effect: this call must run BEFORE the remaining
  # package imports below, which is why those imports carry ``noqa: E402``
  # (module-level import not at top of file). Per the module docstring, it makes
  # sure the project root is on ``sys.path`` so that ``api.*`` imports resolve.
  # NOTE(review): presumably one or more of the submodules imported below depend
  # on ``api.*`` -- not visible from this file; confirm before reordering.
  ensure_project_on_path()
  
  from .constants import (  # noqa: E402
      DEFAULT_ARTIFACT_ROOT,
      DEFAULT_LABELER_MODE,
      DEFAULT_QUERY_FILE,
      JUDGE_PROMPT_VERSION_COMPLEX,
      JUDGE_PROMPT_VERSION_SIMPLE,
      PROJECT_ROOT,
      RELEVANCE_EXACT,
      RELEVANCE_IRRELEVANT,
      RELEVANCE_PARTIAL,
      VALID_LABELS,
  )
  from .framework import SearchEvaluationFramework  # noqa: E402
  from .store import EvalStore, QueryBuildResult  # noqa: E402
  from .cli import build_cli_parser, main  # noqa: E402
  from .web_app import create_web_app  # noqa: E402
  from .reports import render_batch_report_markdown  # noqa: E402
  from .utils import (  # noqa: E402
      ensure_dir,
      sha1_text,
      utc_now_iso,
      utc_timestamp,
  )
  
  # Public API of the package: the names exported by ``from <package> import *``.
  # Every entry corresponds to a name imported at the top of this module.
  # Entries are kept in ASCII sort order (uppercase names sort before lowercase);
  # keep that ordering when adding a new export.
  # ``ensure_project_on_path`` is imported above but is not listed here, so it is
  # not part of the star-import surface.
  __all__ = [
      "DEFAULT_ARTIFACT_ROOT",
      "DEFAULT_LABELER_MODE",
      "DEFAULT_QUERY_FILE",
      "EvalStore",
      "JUDGE_PROMPT_VERSION_COMPLEX",
      "JUDGE_PROMPT_VERSION_SIMPLE",
      "PROJECT_ROOT",
      "QueryBuildResult",
      "RELEVANCE_EXACT",
      "RELEVANCE_IRRELEVANT",
      "RELEVANCE_PARTIAL",
      "SearchEvaluationFramework",
      "VALID_LABELS",
      "build_cli_parser",
      "create_web_app",
      "ensure_dir",
      "main",
      "render_batch_report_markdown",
      "sha1_text",
      "utc_now_iso",
      "utc_timestamp",
  ]