Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 4 additions & 6 deletions src/art/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,10 @@
from .preprocessing.moe_routing import attach_moe_routing_metadata_to_choice
from .trajectories import Trajectory, TrajectoryGroup
from .types import TrainSFTConfig
from .utils.trajectory_logging import write_trajectory_groups_parquet
from .utils.trajectory_logging import (
calculate_step_std_dev,
write_trajectory_groups_parquet,
)

if TYPE_CHECKING:
from wandb.sdk.wandb_run import Run
Expand Down Expand Up @@ -991,11 +994,6 @@ async def log(
group_key = f"group_{metric}"
averages[group_key] = sum(values) / len(values)

# Calculate average standard deviation of rewards within groups
from .utils.old_benchmarking.calculate_step_metrics import (
calculate_step_std_dev,
)

averages[reward_std_dev_key] = calculate_step_std_dev(trajectory_groups)

# Merge in any additional metrics passed directly
Expand Down
3 changes: 1 addition & 2 deletions src/art/utils/benchmarking/aggregate_trajectories.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,8 +21,7 @@ async def load_aggregated_trajectories(
Load trajectories and aggregate metrics at the step level.

This function builds on top of load_trajectories to provide step-level
aggregation similar to load_benchmarked_models, but returns a DataFrame
instead of custom objects.
aggregation as a DataFrame.

Parameters
----------
Expand Down
23 changes: 0 additions & 23 deletions src/art/utils/old_benchmarking/calculate_step_metrics.py

This file was deleted.

11 changes: 0 additions & 11 deletions src/art/utils/old_benchmarking/display_image_grid.py

This file was deleted.

30 changes: 0 additions & 30 deletions src/art/utils/old_benchmarking/generate_comparison_table.py

This file was deleted.

107 changes: 0 additions & 107 deletions src/art/utils/old_benchmarking/generate_line_graphs.py

This file was deleted.

119 changes: 0 additions & 119 deletions src/art/utils/old_benchmarking/load_benchmarked_models.py

This file was deleted.

51 changes: 0 additions & 51 deletions src/art/utils/old_benchmarking/types.py

This file was deleted.

Loading
Loading