Skip to content

Commit

Permalink
Merge pull request #52 from adamkarvonen/update_scr_tpp
Browse files (browse the repository at this point in the history)
update scr_tpp_schema to show top 20 by default
  • Loading branch information
hijohnnylin authored Jan 28, 2025
2 parents 7b2021c + 59320e2 commit f551e7b
Show file tree
Hide file tree
Showing 3 changed files with 6 additions and 2 deletions.
2 changes: 2 additions & 0 deletions sae_bench/evals/scr_and_tpp/eval_output.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,6 +71,7 @@ class ScrMetrics(BaseMetrics):
None,
title="SCR Metric, Top 20 SAE latents",
description="SCR Metric (selecting dir1 if inital profession accuracy is lower than initial gender accuracy, else dir2) ablating the top 20 SAE latents",
json_schema_extra=DEFAULT_DISPLAY,
)
scr_dir2_threshold_20: float | None = Field(
None,
Expand Down Expand Up @@ -324,6 +325,7 @@ class TppMetrics(BaseMetrics):
None,
title="TPP Metric, Top 20 SAE latents",
description="TPP metric when ablating the top 20 SAE latents",
json_schema_extra=DEFAULT_DISPLAY,
)
tpp_threshold_20_intended_diff_only: float | None = Field(
None,
Expand Down
3 changes: 2 additions & 1 deletion sae_bench/evals/scr_and_tpp/eval_output_schema_scr.json
Original file line number Diff line number Diff line change
Expand Up @@ -298,7 +298,8 @@
],
"default": null,
"description": "SCR Metric (selecting dir1 if inital profession accuracy is lower than initial gender accuracy, else dir2) ablating the top 20 SAE latents",
"title": "SCR Metric, Top 20 SAE latents"
"title": "SCR Metric, Top 20 SAE latents",
"ui_default_display": true
},
"scr_dir2_threshold_20": {
"anyOf": [
Expand Down
3 changes: 2 additions & 1 deletion sae_bench/evals/scr_and_tpp/eval_output_schema_tpp.json
Original file line number Diff line number Diff line change
Expand Up @@ -285,7 +285,8 @@
],
"default": null,
"description": "TPP metric when ablating the top 20 SAE latents",
"title": "TPP Metric, Top 20 SAE latents"
"title": "TPP Metric, Top 20 SAE latents",
"ui_default_display": true
},
"tpp_threshold_20_intended_diff_only": {
"anyOf": [
Expand Down

0 comments on commit f551e7b

Please sign in to comment.