Unnamed: 0,autoencoder_group_path,autoencoder_path,reconstruction_file,trainer_class,sae_class,eval_sae_n_inputs,eval_results_n_inputs,board_reconstruction_n_inputs,l0,l1_loss,l2_loss,frac_alive,frac_variance_explained,cossim,l2_ratio,loss_original,loss_reconstructed,loss_zero,frac_recovered,num_alive_features,board_to_piece_state_board_reconstruction_board_count,board_to_piece_state_num_squares,board_to_piece_state_best_idx,board_to_piece_state_zero_L0,board_to_piece_state_best_L0,board_to_piece_state_zero_f1_score_per_class,board_to_piece_state_best_f1_score_per_class,board_to_piece_state_last_f1_score_per_class,board_to_piece_state_zero_num_true_positive_squares,board_to_piece_state_best_num_true_positive_squares,board_to_piece_state_zero_num_false_positive_squares,board_to_piece_state_best_num_false_positive_squares,board_to_piece_state_zero_num_false_negative_squares,board_to_piece_state_best_num_false_negative_squares,board_to_piece_state_zero_multiple_classes,board_to_piece_state_best_multiple_classes,board_to_piece_state_zero_num_true_and_false_positive_squares,board_to_piece_state_best_num_true_and_false_positive_squares,board_to_piece_state_high_precision_counts_per_T,board_to_piece_state_high_precision_and_recall_counts_per_T,board_to_piece_masked_blank_state_board_reconstruction_board_count,board_to_piece_masked_blank_state_num_squares,board_to_piece_masked_blank_state_best_idx,board_to_piece_masked_blank_state_zero_L0,board_to_piece_masked_blank_state_best_L0,board_to_piece_masked_blank_state_zero_f1_score_per_class,board_to_piece_masked_blank_state_best_f1_score_per_class,board_to_piece_masked_blank_state_last_f1_score_per_class,board_to_piece_masked_blank_state_zero_num_true_positive_squares,board_to_piece_masked_blank_state_best_num_true_positive_squares,board_to_piece_masked_blank_state_zero_num_false_positive_squares,board_to_piece_masked_blank_state_best_num_false_positive_squares,board_to_piece_masked_blank_state_zero_num_false_negative_squares,board_to_piece_masked_blank_state_best_num_false_negative_squares,board_to_piece_masked_blank_state_zero_multiple_classes,board_to_piece_masked_blank_state_best_multiple_classes,board_to_piece_masked_blank_state_zero_num_true_and_false_positive_squares,board_to_piece_masked_blank_state_best_num_true_and_false_positive_squares,board_to_piece_masked_blank_state_high_precision_counts_per_T,board_to_piece_masked_blank_state_high_precision_and_recall_counts_per_T,board_to_piece_masked_blank_and_initial_state_board_reconstruction_board_count,board_to_piece_masked_blank_and_initial_state_num_squares,board_to_piece_masked_blank_and_initial_state_best_idx,board_to_piece_masked_blank_and_initial_state_zero_L0,board_to_piece_masked_blank_and_initial_state_best_L0,board_to_piece_masked_blank_and_initial_state_zero_f1_score_per_class,board_to_piece_masked_blank_and_initial_state_best_f1_score_per_class,board_to_piece_masked_blank_and_initial_state_last_f1_score_per_class,board_to_piece_masked_blank_and_initial_state_zero_num_true_positive_squares,board_to_piece_masked_blank_and_initial_state_best_num_true_positive_squares,board_to_piece_masked_blank_and_initial_state_zero_num_false_positive_squares,board_to_piece_masked_blank_and_initial_state_best_num_false_positive_squares,board_to_piece_masked_blank_and_initial_state_zero_num_false_negative_squares,board_to_piece_masked_blank_and_initial_state_best_num_false_negative_squares,board_to_piece_masked_blank_and_initial_state_zero_multiple_classes,board_to_piece_masked_blank_and_initial_state_best_multiple_classes,board_to_piece_masked_blank_and_initial_state_zero_num_true_and_false_positive_squares,board_to_piece_masked_blank_and_initial_state_best_num_true_and_false_positive_squares,board_to_piece_masked_blank_and_initial_state_high_precision_counts_per_T,board_to_piece_masked_blank_and_initial_state_high_precision_and_recall_counts_per_T,board_to_piece_color_state_board_reconstruction_board_count,board_to_piece_color_state_num_squares,board_to_piece_color_state_best_idx,board_to_piece_color_state_zero_L0,board_to_piece_color_state_best_L0,board_to_piece_color_state_zero_f1_score_per_class,board_to_piece_color_state_best_f1_score_per_class,board_to_piece_color_state_last_f1_score_per_class,board_to_piece_color_state_zero_num_true_positive_squares,board_to_piece_color_state_best_num_true_positive_squares,board_to_piece_color_state_zero_num_false_positive_squares,board_to_piece_color_state_best_num_false_positive_squares,board_to_piece_color_state_zero_num_false_negative_squares,board_to_piece_color_state_best_num_false_negative_squares,board_to_piece_color_state_zero_multiple_classes,board_to_piece_color_state_best_multiple_classes,board_to_piece_color_state_zero_num_true_and_false_positive_squares,board_to_piece_color_state_best_num_true_and_false_positive_squares,board_to_piece_color_state_high_precision_counts_per_T,board_to_piece_color_state_high_precision_and_recall_counts_per_T,board_to_pin_state_board_reconstruction_board_count,board_to_pin_state_num_squares,board_to_pin_state_best_idx,board_to_pin_state_zero_L0,board_to_pin_state_best_L0,board_to_pin_state_zero_f1_score_per_class,board_to_pin_state_best_f1_score_per_class,board_to_pin_state_last_f1_score_per_class,board_to_pin_state_zero_num_true_positive_squares,board_to_pin_state_best_num_true_positive_squares,board_to_pin_state_zero_num_false_positive_squares,board_to_pin_state_best_num_false_positive_squares,board_to_pin_state_zero_num_false_negative_squares,board_to_pin_state_best_num_false_negative_squares,board_to_pin_state_zero_multiple_classes,board_to_pin_state_best_multiple_classes,board_to_pin_state_zero_num_true_and_false_positive_squares,board_to_pin_state_best_num_true_and_false_positive_squares,board_to_pin_state_high_precision_counts_per_T,board_to_pin_state_high_precision_and_recall_counts_per_T,board_to_threat_state_board_reconstruction_board_count,board_to_threat_state_num_squares,board_to_threat_state_best_idx,board_to_threat_state_zero_L0,board_to_threat_state_best_L0,board_to_threat_state_zero_f1_score_per_class,board_to_threat_state_best_f1_score_per_class,board_to_threat_state_last_f1_score_per_class,board_to_threat_state_zero_num_true_positive_squares,board_to_threat_state_best_num_true_positive_squares,board_to_threat_state_zero_num_false_positive_squares,board_to_threat_state_best_num_false_positive_squares,board_to_threat_state_zero_num_false_negative_squares,board_to_threat_state_best_num_false_negative_squares,board_to_threat_state_zero_multiple_classes,board_to_threat_state_best_multiple_classes,board_to_threat_state_zero_num_true_and_false_positive_squares,board_to_threat_state_best_num_true_and_false_positive_squares,board_to_threat_state_high_precision_counts_per_T,board_to_threat_state_high_precision_and_recall_counts_per_T,board_to_check_state_board_reconstruction_board_count,board_to_check_state_num_squares,board_to_check_state_best_idx,board_to_check_state_zero_L0,board_to_check_state_best_L0,board_to_check_state_zero_f1_score_per_class,board_to_check_state_best_f1_score_per_class,board_to_check_state_last_f1_score_per_class,board_to_check_state_zero_num_true_positive_squares,board_to_check_state_best_num_true_positive_squares,board_to_check_state_zero_num_false_positive_squares,board_to_check_state_best_num_false_positive_squares,board_to_check_state_zero_num_false_negative_squares,board_to_check_state_best_num_false_negative_squares,board_to_check_state_zero_multiple_classes,board_to_check_state_best_multiple_classes,board_to_check_state_zero_num_true_and_false_positive_squares,board_to_check_state_best_num_true_and_false_positive_squares,board_to_check_state_high_precision_counts_per_T,board_to_check_state_high_precision_and_recall_counts_per_T,board_to_legal_moves_state_board_reconstruction_board_count,board_to_legal_moves_state_num_squares,board_to_legal_moves_state_best_idx,board_to_legal_moves_state_zero_L0,board_to_legal_moves_state_best_L0,board_to_legal_moves_state_zero_f1_score_per_class,board_to_legal_moves_state_best_f1_score_per_class,board_to_legal_moves_state_last_f1_score_per_class,board_to_legal_moves_state_zero_num_true_positive_squares,board_to_legal_moves_state_best_num_true_positive_squares,board_to_legal_moves_state_zero_num_false_positive_squares,board_to_legal_moves_state_best_num_false_positive_squares,board_to_legal_moves_state_zero_num_false_negative_squares,board_to_legal_moves_state_best_num_false_negative_squares,board_to_legal_moves_state_zero_multiple_classes,board_to_legal_moves_state_best_multiple_classes,board_to_legal_moves_state_zero_num_true_and_false_positive_squares,board_to_legal_moves_state_best_num_true_and_false_positive_squares,board_to_legal_moves_state_high_precision_counts_per_T,board_to_legal_moves_state_high_precision_and_recall_counts_per_T,board_to_specific_fork_board_reconstruction_board_count,board_to_specific_fork_num_squares,board_to_specific_fork_best_idx,board_to_specific_fork_zero_L0,board_to_specific_fork_best_L0,board_to_specific_fork_zero_f1_score_per_class,board_to_specific_fork_best_f1_score_per_class,board_to_specific_fork_last_f1_score_per_class,board_to_specific_fork_zero_num_true_positive_squares,board_to_specific_fork_best_num_true_positive_squares,board_to_specific_fork_zero_num_false_positive_squares,board_to_specific_fork_best_num_false_positive_squares,board_to_specific_fork_zero_num_false_negative_squares,board_to_specific_fork_best_num_false_negative_squares,board_to_specific_fork_zero_multiple_classes,board_to_specific_fork_best_multiple_classes,board_to_specific_fork_zero_num_true_and_false_positive_squares,board_to_specific_fork_best_num_true_and_false_positive_squares,board_to_specific_fork_high_precision_counts_per_T,board_to_specific_fork_high_precision_and_recall_counts_per_T,board_to_any_fork_board_reconstruction_board_count,board_to_any_fork_num_squares,board_to_any_fork_best_idx,board_to_any_fork_zero_L0,board_to_any_fork_best_L0,board_to_any_fork_zero_f1_score_per_class,board_to_any_fork_best_f1_score_per_class,board_to_any_fork_last_f1_score_per_class,board_to_any_fork_zero_num_true_positive_squares,board_to_any_fork_best_num_true_positive_squares,board_to_any_fork_zero_num_false_positive_squares,board_to_any_fork_best_num_false_positive_squares,board_to_any_fork_zero_num_false_negative_squares,board_to_any_fork_best_num_false_negative_squares,board_to_any_fork_zero_multiple_classes,board_to_any_fork_best_multiple_classes,board_to_any_fork_zero_num_true_and_false_positive_squares,board_to_any_fork_best_num_true_and_false_positive_squares,board_to_any_fork_high_precision_counts_per_T,board_to_any_fork_high_precision_and_recall_counts_per_T,board_to_has_castling_rights_board_reconstruction_board_count,board_to_has_castling_rights_num_squares,board_to_has_castling_rights_best_idx,board_to_has_castling_rights_zero_L0,board_to_has_castling_rights_best_L0,board_to_has_castling_rights_zero_f1_score_per_class,board_to_has_castling_rights_best_f1_score_per_class,board_to_has_castling_rights_last_f1_score_per_class,board_to_has_castling_rights_zero_num_true_positive_squares,board_to_has_castling_rights_best_num_true_positive_squares,board_to_has_castling_rights_zero_num_false_positive_squares,board_to_has_castling_rights_best_num_false_positive_squares,board_to_has_castling_rights_zero_num_false_negative_squares,board_to_has_castling_rights_best_num_false_negative_squares,board_to_has_castling_rights_zero_multiple_classes,board_to_has_castling_rights_best_multiple_classes,board_to_has_castling_rights_zero_num_true_and_false_positive_squares,board_to_has_castling_rights_best_num_true_and_false_positive_squares,board_to_has_castling_rights_high_precision_counts_per_T,board_to_has_castling_rights_high_precision_and_recall_counts_per_T,board_to_has_queenside_castling_rights_board_reconstruction_board_count,board_to_has_queenside_castling_rights_num_squares,board_to_has_queenside_castling_rights_best_idx,board_to_has_queenside_castling_rights_zero_L0,board_to_has_queenside_castling_rights_best_L0,board_to_has_queenside_castling_rights_zero_f1_score_per_class,board_to_has_queenside_castling_rights_best_f1_score_per_class,board_to_has_queenside_castling_rights_last_f1_score_per_class,board_to_has_queenside_castling_rights_zero_num_true_positive_squares,board_to_has_queenside_castling_rights_best_num_true_positive_squares,board_to_has_queenside_castling_rights_zero_num_false_positive_squares,board_to_has_queenside_castling_rights_best_num_false_positive_squares,board_to_has_queenside_castling_rights_zero_num_false_negative_squares,board_to_has_queenside_castling_rights_best_num_false_negative_squares,board_to_has_queenside_castling_rights_zero_multiple_classes,board_to_has_queenside_castling_rights_best_multiple_classes,board_to_has_queenside_castling_rights_zero_num_true_and_false_positive_squares,board_to_has_queenside_castling_rights_best_num_true_and_false_positive_squares,board_to_has_queenside_castling_rights_high_precision_counts_per_T,board_to_has_queenside_castling_rights_high_precision_and_recall_counts_per_T,board_to_has_kingside_castling_rights_board_reconstruction_board_count,board_to_has_kingside_castling_rights_num_squares,board_to_has_kingside_castling_rights_best_idx,board_to_has_kingside_castling_rights_zero_L0,board_to_has_kingside_castling_rights_best_L0,board_to_has_kingside_castling_rights_zero_f1_score_per_class,board_to_has_kingside_castling_rights_best_f1_score_per_class,board_to_has_kingside_castling_rights_last_f1_score_per_class,board_to_has_kingside_castling_rights_zero_num_true_positive_squares,board_to_has_kingside_castling_rights_best_num_true_positive_squares,board_to_has_kingside_castling_rights_zero_num_false_positive_squares,board_to_has_kingside_castling_rights_best_num_false_positive_squares,board_to_has_kingside_castling_rights_zero_num_false_negative_squares,board_to_has_kingside_castling_rights_best_num_false_negative_squares,board_to_has_kingside_castling_rights_zero_multiple_classes,board_to_has_kingside_castling_rights_best_multiple_classes,board_to_has_kingside_castling_rights_zero_num_true_and_false_positive_squares,board_to_has_kingside_castling_rights_best_num_true_and_false_positive_squares,board_to_has_kingside_castling_rights_high_precision_counts_per_T,board_to_has_kingside_castling_rights_high_precision_and_recall_counts_per_T,board_to_has_legal_en_passant_board_reconstruction_board_count,board_to_has_legal_en_passant_num_squares,board_to_has_legal_en_passant_best_idx,board_to_has_legal_en_passant_zero_L0,board_to_has_legal_en_passant_best_L0,board_to_has_legal_en_passant_zero_f1_score_per_class,board_to_has_legal_en_passant_best_f1_score_per_class,board_to_has_legal_en_passant_last_f1_score_per_class,board_to_has_legal_en_passant_zero_num_true_positive_squares,board_to_has_legal_en_passant_best_num_true_positive_squares,board_to_has_legal_en_passant_zero_num_false_positive_squares,board_to_has_legal_en_passant_best_num_false_positive_squares,board_to_has_legal_en_passant_zero_num_false_negative_squares,board_to_has_legal_en_passant_best_num_false_negative_squares,board_to_has_legal_en_passant_zero_multiple_classes,board_to_has_legal_en_passant_best_multiple_classes,board_to_has_legal_en_passant_zero_num_true_and_false_positive_squares,board_to_has_legal_en_passant_best_num_true_and_false_positive_squares,board_to_has_legal_en_passant_high_precision_counts_per_T,board_to_has_legal_en_passant_high_precision_and_recall_counts_per_T,board_to_pseudo_legal_moves_state_board_reconstruction_board_count,board_to_pseudo_legal_moves_state_num_squares,board_to_pseudo_legal_moves_state_best_idx,board_to_pseudo_legal_moves_state_zero_L0,board_to_pseudo_legal_moves_state_best_L0,board_to_pseudo_legal_moves_state_zero_f1_score_per_class,board_to_pseudo_legal_moves_state_best_f1_score_per_class,board_to_pseudo_legal_moves_state_last_f1_score_per_class,board_to_pseudo_legal_moves_state_zero_num_true_positive_squares,board_to_pseudo_legal_moves_state_best_num_true_positive_squares,board_to_pseudo_legal_moves_state_zero_num_false_positive_squares,board_to_pseudo_legal_moves_state_best_num_false_positive_squares,board_to_pseudo_legal_moves_state_zero_num_false_negative_squares,board_to_pseudo_legal_moves_state_best_num_false_negative_squares,board_to_pseudo_legal_moves_state_zero_multiple_classes,board_to_pseudo_legal_moves_state_best_multiple_classes,board_to_pseudo_legal_moves_state_zero_num_true_and_false_positive_squares,board_to_pseudo_legal_moves_state_best_num_true_and_false_positive_squares,board_to_pseudo_legal_moves_state_high_precision_counts_per_T,board_to_pseudo_legal_moves_state_high_precision_and_recall_counts_per_T,board_to_can_claim_draw_board_reconstruction_board_count,board_to_can_claim_draw_num_squares,board_to_can_claim_draw_best_idx,board_to_can_claim_draw_zero_L0,board_to_can_claim_draw_best_L0,board_to_can_claim_draw_zero_f1_score_per_class,board_to_can_claim_draw_best_f1_score_per_class,board_to_can_claim_draw_last_f1_score_per_class,board_to_can_claim_draw_zero_num_true_positive_squares,board_to_can_claim_draw_best_num_true_positive_squares,board_to_can_claim_draw_zero_num_false_positive_squares,board_to_can_claim_draw_best_num_false_positive_squares,board_to_can_claim_draw_zero_num_false_negative_squares,board_to_can_claim_draw_best_num_false_negative_squares,board_to_can_claim_draw_zero_multiple_classes,board_to_can_claim_draw_best_multiple_classes,board_to_can_claim_draw_zero_num_true_and_false_positive_squares,board_to_can_claim_draw_best_num_true_and_false_positive_squares,board_to_can_claim_draw_high_precision_counts_per_T,board_to_can_claim_draw_high_precision_and_recall_counts_per_T,board_to_can_check_next_board_reconstruction_board_count,board_to_can_check_next_num_squares,board_to_can_check_next_best_idx,board_to_can_check_next_zero_L0,board_to_can_check_next_best_L0,board_to_can_check_next_zero_f1_score_per_class,board_to_can_check_next_best_f1_score_per_class,board_to_can_check_next_last_f1_score_per_class,board_to_can_check_next_zero_num_true_positive_squares,board_to_can_check_next_best_num_true_positive_squares,board_to_can_check_next_zero_num_false_positive_squares,board_to_can_check_next_best_num_false_positive_squares,board_to_can_check_next_zero_num_false_negative_squares,board_to_can_check_next_best_num_false_negative_squares,board_to_can_check_next_zero_multiple_classes,board_to_can_check_next_best_multiple_classes,board_to_can_check_next_zero_num_true_and_false_positive_squares,board_to_can_check_next_best_num_true_and_false_positive_squares,board_to_can_check_next_high_precision_counts_per_T,board_to_can_check_next_high_precision_and_recall_counts_per_T,board_to_has_bishop_pair_board_reconstruction_board_count,board_to_has_bishop_pair_num_squares,board_to_has_bishop_pair_best_idx,board_to_has_bishop_pair_zero_L0,board_to_has_bishop_pair_best_L0,board_to_has_bishop_pair_zero_f1_score_per_class,board_to_has_bishop_pair_best_f1_score_per_class,board_to_has_bishop_pair_last_f1_score_per_class,board_to_has_bishop_pair_zero_num_true_positive_squares,board_to_has_bishop_pair_best_num_true_positive_squares,board_to_has_bishop_pair_zero_num_false_positive_squares,board_to_has_bishop_pair_best_num_false_positive_squares,board_to_has_bishop_pair_zero_num_false_negative_squares,board_to_has_bishop_pair_best_num_false_negative_squares,board_to_has_bishop_pair_zero_multiple_classes,board_to_has_bishop_pair_best_multiple_classes,board_to_has_bishop_pair_zero_num_true_and_false_positive_squares,board_to_has_bishop_pair_best_num_true_and_false_positive_squares,board_to_has_bishop_pair_high_precision_counts_per_T,board_to_has_bishop_pair_high_precision_and_recall_counts_per_T,board_to_has_mate_threat_board_reconstruction_board_count,board_to_has_mate_threat_num_squares,board_to_has_mate_threat_best_idx,board_to_has_mate_threat_zero_L0,board_to_has_mate_threat_best_L0,board_to_has_mate_threat_zero_f1_score_per_class,board_to_has_mate_threat_best_f1_score_per_class,board_to_has_mate_threat_last_f1_score_per_class,board_to_has_mate_threat_zero_num_true_positive_squares,board_to_has_mate_threat_best_num_true_positive_squares,board_to_has_mate_threat_zero_num_false_positive_squares,board_to_has_mate_threat_best_num_false_positive_squares,board_to_has_mate_threat_zero_num_false_negative_squares,board_to_has_mate_threat_best_num_false_negative_squares,board_to_has_mate_threat_zero_multiple_classes,board_to_has_mate_threat_best_multiple_classes,board_to_has_mate_threat_zero_num_true_and_false_positive_squares,board_to_has_mate_threat_best_num_true_and_false_positive_squares,board_to_has_mate_threat_high_precision_counts_per_T,board_to_has_mate_threat_high_precision_and_recall_counts_per_T,board_to_can_capture_queen_board_reconstruction_board_count,board_to_can_capture_queen_num_squares,board_to_can_capture_queen_best_idx,board_to_can_capture_queen_zero_L0,board_to_can_capture_queen_best_L0,board_to_can_capture_queen_zero_f1_score_per_class,board_to_can_capture_queen_best_f1_score_per_class,board_to_can_capture_queen_last_f1_score_per_class,board_to_can_capture_queen_zero_num_true_positive_squares,board_to_can_capture_queen_best_num_true_positive_squares,board_to_can_capture_queen_zero_num_false_positive_squares,board_to_can_capture_queen_best_num_false_positive_squares,board_to_can_capture_queen_zero_num_false_negative_squares,board_to_can_capture_queen_best_num_false_negative_squares,board_to_can_capture_queen_zero_multiple_classes,board_to_can_capture_queen_best_multiple_classes,board_to_can_capture_queen_zero_num_true_and_false_positive_squares,board_to_can_capture_queen_best_num_true_and_false_positive_squares,board_to_can_capture_queen_high_precision_counts_per_T,board_to_can_capture_queen_high_precision_and_recall_counts_per_T,board_to_has_queen_board_reconstruction_board_count,board_to_has_queen_num_squares,board_to_has_queen_best_idx,board_to_has_queen_zero_L0,board_to_has_queen_best_L0,board_to_has_queen_zero_f1_score_per_class,board_to_has_queen_best_f1_score_per_class,board_to_has_queen_last_f1_score_per_class,board_to_has_queen_zero_num_true_positive_squares,board_to_has_queen_best_num_true_positive_squares,board_to_has_queen_zero_num_false_positive_squares,board_to_has_queen_best_num_false_positive_squares,board_to_has_queen_zero_num_false_negative_squares,board_to_has_queen_best_num_false_negative_squares,board_to_has_queen_zero_multiple_classes,board_to_has_queen_best_multiple_classes,board_to_has_queen_zero_num_true_and_false_positive_squares,board_to_has_queen_best_num_true_and_false_positive_squares,board_to_has_queen_high_precision_counts_per_T,board_to_has_queen_high_precision_and_recall_counts_per_T,board_to_has_connected_rooks_board_reconstruction_board_count,board_to_has_connected_rooks_num_squares,board_to_has_connected_rooks_best_idx,board_to_has_connected_rooks_zero_L0,board_to_has_connected_rooks_best_L0,board_to_has_connected_rooks_zero_f1_score_per_class,board_to_has_connected_rooks_best_f1_score_per_class,board_to_has_connected_rooks_last_f1_score_per_class,board_to_has_connected_rooks_zero_num_true_positive_squares,board_to_has_connected_rooks_best_num_true_positive_squares,board_to_has_connected_rooks_zero_num_false_positive_squares,board_to_has_connected_rooks_best_num_false_positive_squares,board_to_has_connected_rooks_zero_num_false_negative_squares,board_to_has_connected_rooks_best_num_false_negative_squares,board_to_has_connected_rooks_zero_multiple_classes,board_to_has_connected_rooks_best_multiple_classes,board_to_has_connected_rooks_zero_num_true_and_false_positive_squares,board_to_has_connected_rooks_best_num_true_and_false_positive_squares,board_to_has_connected_rooks_high_precision_counts_per_T,board_to_has_connected_rooks_high_precision_and_recall_counts_per_T,board_to_ambiguous_moves_board_reconstruction_board_count,board_to_ambiguous_moves_num_squares,board_to_ambiguous_moves_best_idx,board_to_ambiguous_moves_zero_L0,board_to_ambiguous_moves_best_L0,board_to_ambiguous_moves_zero_f1_score_per_class,board_to_ambiguous_moves_best_f1_score_per_class,board_to_ambiguous_moves_last_f1_score_per_class,board_to_ambiguous_moves_zero_num_true_positive_squares,board_to_ambiguous_moves_best_num_true_positive_squares,board_to_ambiguous_moves_zero_num_false_positive_squares,board_to_ambiguous_moves_best_num_false_positive_squares,board_to_ambiguous_moves_zero_num_false_negative_squares,board_to_ambiguous_moves_best_num_false_negative_squares,board_to_ambiguous_moves_zero_multiple_classes,board_to_ambiguous_moves_best_multiple_classes,board_to_ambiguous_moves_zero_num_true_and_false_positive_squares,board_to_ambiguous_moves_best_num_true_and_false_positive_squares,board_to_ambiguous_moves_high_precision_counts_per_T,board_to_ambiguous_moves_high_precision_and_recall_counts_per_T 0,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_0/,autoencoders/matryoshka_chess/trainer_0/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,10.119999885559082,23.24002456665039,2.2731430530548096,0.046875,0.947382390499115,0.949707329273224,0.9537145495414734,0.2971398532390594,0.4201032519340515,3.4657371044158936,0.9611930847167968,3835,20000,1280000,0,14.629825592041016,14.629825592041016,0.6616300940513611,0.6616300940513611,0.7643902897834778,647850,647850,30495,30495,632150,632150,13764,13764,13536,13536,"tensor([12446, 12456, 12339, 12593, 12869, 12449, 12941, 12402, 10309, 5434, 1216], device='cuda:0')","tensor([254, 254, 260, 306, 370, 388, 399, 359, 247, 76, 4], device='cuda:0')",20000,578762,0,14.629825592041016,14.629825592041016,0.7193474173545837,0.7193474173545837,0.7993974089622498,332063,332063,12409,12409,246699,246699,1404,1404,1364,1364,"tensor([4936, 4955, 4917, 5070, 5252, 5073, 5313, 5180, 4504, 2528, 604], device='cuda:0')","tensor([245, 245, 251, 296, 359, 377, 389, 349, 241, 72, 4], device='cuda:0')",20000,221620,3,14.629825592041016,12.867572784423828,0.722435712814331,0.7285798192024231,0.8143664002418518,126993,128308,2956,2286,94627,93312,876,748,856,737,"tensor([538, 539, 548, 617, 733, 779, 807, 739, 567, 237, 50], device='cuda:0')","tensor([243, 243, 249, 294, 357, 376, 389, 349, 241, 72, 4], device='cuda:0')",20000,1280000,0,14.629825592041016,14.629825592041016,0.6890547871589661,0.6890547871589661,0.778552234172821,689143,689143,31113,31113,590857,590857,15593,15593,15574,15574,"tensor([13333, 13334, 13194, 13407, 13603, 13101, 13591, 12955, 10656, 5536, 1216], device='cuda:0')","tensor([207, 210, 213, 224, 230, 229, 210, 181, 111, 31, 0], device='cuda:0')",20000,1922,7,14.629825592041016,3.367624044418335,0.027706516906619,0.0798403173685073,0.1220107451081276,27,80,0,2,1895,1842,0,0,0,0,"tensor([1, 1, 1, 1, 1, 2, 2, 3, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,2,14.629825592041016,14.19711971282959,0.8916904926300049,0.8918077349662781,0.9131327271461488,543435,543382,17214,16988,114803,114856,0,0,0,0,"tensor([17153, 17094, 16889, 16565, 16021, 14844, 14096, 12007, 8399, 3283, 551], device='cuda:0')","tensor([70, 70, 71, 81, 86, 99, 89, 70, 46, 22, 4], device='cuda:0')",20000,392,0,14.629825592041016,14.629825592041016,0.9949238896369934,0.9949238896369934,0.9898989796638488,392,392,4,4,0,0,0,0,0,0,"tensor([14, 14, 14, 18, 15, 13, 11, 8, 5, 2, 0], device='cuda:0')","tensor([14, 14, 14, 18, 15, 13, 11, 8, 5, 2, 0], device='cuda:0')",20000,434590,4,14.629825592041016,10.722323417663574,0.510577917098999,0.5564153790473938,0.6834292411804199,151827,170479,8309,7707,282763,264111,0,0,0,0,"tensor([3225, 3245, 3237, 3385, 3611, 3597, 3870, 3806, 3292, 1732, 362], device='cuda:0')","tensor([26, 26, 26, 30, 36, 40, 43, 32, 30, 15, 0], device='cuda:0')",20000,7,0,14.629825592041016,14.629825592041016,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,14.629825592041016,14.629825592041016,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,0,14.629825592041016,14.629825592041016,0.946526825428009,0.946526825428009,0.9455482959747314,9886,9886,461,461,656,656,0,0,0,0,"tensor([187, 189, 191, 188, 180, 171, 171, 166, 143, 83, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,0,14.629825592041016,14.629825592041016,0.9245850443840028,0.9245850443840028,0.9228684902191162,9385,9385,618,618,913,913,0,0,0,0,"tensor([179, 181, 180, 182, 173, 164, 165, 158, 137, 81, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,0,14.629825592041016,14.629825592041016,0.9394159317016602,0.9394159317016602,0.9376689195632936,9699,9699,625,625,626,626,0,0,0,0,"tensor([184, 186, 188, 186, 179, 169, 169, 166, 142, 83, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,5,14.629825592041016,8.166143417358398,0.0,0.9019608497619628,0.9019608497619628,0,46,0,3,53,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0], device='cuda:0')",20000,443761,4,14.629825592041016,10.722323417663574,0.5570624470710754,0.5821703672409058,0.695736825466156,175002,185655,9540,8387,268759,258106,0,0,0,0,"tensor([3606, 3604, 3596, 3722, 3891, 3837, 4058, 3935, 3376, 1763, 362], device='cuda:0')","tensor([38, 38, 38, 40, 41, 43, 41, 35, 30, 15, 0], device='cuda:0')",20000,0,0,14.629825592041016,14.629825592041016,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,6,14.629825592041016,5.587350368499756,0.0900612100958824,0.1603707373142242,0.2700366675853729,309,571,26,23,6218,5956,0,0,0,0,"tensor([ 9, 9, 8, 10, 15, 14, 14, 16, 15, 13, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,0,14.629825592041016,14.629825592041016,0.7299472689628601,0.7299472689628601,0.7810483574867249,8436,8436,467,467,5775,5775,0,0,0,0,"tensor([257, 258, 253, 256, 248, 234, 230, 207, 177, 94, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,14.629825592041016,14.629825592041016,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,14.629825592041016,8.166143417358398,0.525519847869873,0.5404412150382996,0.5961198806762695,139,147,5,12,246,238,0,0,0,0,"tensor([5, 5, 5, 5, 4, 6, 5, 4, 1, 0, 0], device='cuda:0')","tensor([5, 5, 5, 5, 4, 6, 5, 4, 1, 0, 0], device='cuda:0')",20000,18325,3,14.629825592041016,12.867572784423828,0.9650933146476746,0.9661564826965332,0.9616344571113586,18137,18085,1124,1027,188,240,0,0,0,0,"tensor([552, 550, 541, 536, 514, 479, 465, 416, 295, 128, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,6,14.629825592041016,5.587350368499756,0.0,0.0685197189450264,0.0685197189450264,0,106,0,0,2988,2882,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 2, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,14.629825592041016,5.587350368499756,0.0191143676638603,0.0541301667690277,0.0975461080670356,60,173,0,1,6158,6045,0,0,0,0,"tensor([2, 2, 2, 3, 3, 4, 5, 5, 6, 5, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 1,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_1/,autoencoders/matryoshka_chess/trainer_1/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,31.920000076293945,36.49705123901367,1.7325013875961304,0.11474609375,0.9698984622955322,0.972705066204071,0.9790810346603394,0.2971398532390594,0.3140596151351928,3.4657371044158936,0.9946601986885072,4062,20000,1280000,3,40.66462707519531,23.72368431091309,0.6190459132194519,0.6855659484863281,0.7940834164619446,591603,682277,39735,28128,688397,597723,6825,12686,6713,12561,"tensor([14499, 13869, 12871, 13465, 13665, 13660, 13779, 14198, 10193, 6038, 1404], device='cuda:0')","tensor([ 70, 75, 152, 226, 286, 302, 315, 298, 187, 56, 6], device='cuda:0')",20000,578762,3,40.66462707519531,23.72368431091309,0.628078818321228,0.7592748999595642,0.8433747887611389,273344,360651,18307,10575,305418,218111,713,1072,698,1062,"tensor([5804, 5726, 5327, 5693, 5826, 5817, 5860, 6072, 4516, 2884, 699], device='cuda:0')","tensor([ 69, 74, 151, 221, 279, 292, 305, 293, 184, 52, 5], device='cuda:0')",20000,221620,3,40.66462707519531,23.72368431091309,0.3245017826557159,0.7338618636131287,0.8349894881248474,43247,129509,1677,1823,178373,92111,81,494,76,489,"tensor([225, 239, 356, 497, 601, 651, 679, 692, 472, 240, 60], device='cuda:0')","tensor([ 68, 71, 147, 219, 277, 291, 305, 293, 184, 52, 5], device='cuda:0')",20000,1280000,2,40.66462707519531,30.77909278869629,0.7029430866241455,0.7258986234664917,0.8144821524620056,717107,748330,43192,33473,562893,531670,13938,17349,13868,17325,"tensor([15526, 14764, 13720, 14270, 14389, 14341, 14425, 14808, 10578, 6125, 1404], device='cuda:0')","tensor([ 96, 110, 165, 203, 209, 209, 194, 161, 89, 25, 2], device='cuda:0')",20000,1922,2,40.66462707519531,30.77909278869629,0.0,0.0693119019269943,0.1016781851649284,0,69,0,0,1922,1853,0,0,0,0,"tensor([0, 0, 1, 1, 1, 2, 2, 2, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,40.66462707519531,23.72368431091309,0.8860848546028137,0.9061773419380188,0.9303321242332458,541284,559772,22221,17448,116954,98466,0,0,0,0,"tensor([22417, 20456, 18496, 17448, 16582, 15631, 14497, 13037, 8158, 3467, 623], device='cuda:0')","tensor([33, 33, 48, 74, 83, 84, 90, 85, 42, 8, 2], device='cuda:0')",20000,392,3,40.66462707519531,23.72368431091309,0.8383404612541199,0.9805447459220886,0.9636135697364808,293,378,14,1,99,14,0,0,0,0,"tensor([16, 16, 19, 20, 16, 15, 11, 9, 4, 0, 0], device='cuda:0')","tensor([16, 16, 19, 20, 16, 15, 11, 9, 4, 0, 0], device='cuda:0')",20000,434590,3,40.66462707519531,23.72368431091309,0.504986047744751,0.5331715941429138,0.6872545480728149,150172,160868,9995,7980,284418,273722,0,0,0,0,"tensor([3527, 3480, 3358, 3673, 3842, 4012, 4096, 4326, 3120, 1816, 427], device='cuda:0')","tensor([ 7, 7, 12, 28, 29, 30, 30, 27, 13, 6, 0], device='cuda:0')",20000,7,0,40.66462707519531,40.66462707519531,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,40.66462707519531,40.66462707519531,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,40.66462707519531,23.72368431091309,0.880484402179718,0.958331286907196,0.9403913617134094,8870,10039,736,370,1672,503,0,0,0,0,"tensor([231, 235, 208, 220, 209, 207, 204, 199, 146, 94, 22], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,0,40.66462707519531,40.66462707519531,0.862500011920929,0.862500011920929,0.9242125153541564,8349,8349,713,713,1949,1949,0,0,0,0,"tensor([223, 225, 201, 208, 201, 197, 195, 194, 143, 94, 22], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,40.66462707519531,12.304795265197754,0.8457586765289307,0.9289758801460266,0.9321345090866088,8066,9352,683,457,2259,973,0,0,0,0,"tensor([227, 229, 204, 216, 206, 205, 204, 199, 146, 93, 22], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,40.66462707519531,7.569630146026611,0.0,0.8653846383094788,0.8653846383094788,0,45,0,6,53,8,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0], device='cuda:0')",20000,443761,3,40.66462707519531,23.72368431091309,0.532137930393219,0.5600327253341675,0.7050157189369202,164710,175990,10579,8748,279051,267771,0,0,0,0,"tensor([4079, 3904, 3704, 3995, 4114, 4229, 4265, 4463, 3223, 1852, 427], device='cuda:0')","tensor([11, 11, 15, 31, 32, 34, 29, 27, 13, 6, 0], device='cuda:0')",20000,0,0,40.66462707519531,40.66462707519531,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,2,40.66462707519531,30.77909278869629,0.1631799191236496,0.175239160656929,0.3126191198825836,585,632,58,54,5942,5895,0,0,0,0,"tensor([ 8, 8, 10, 11, 16, 13, 17, 21, 13, 16, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,40.66462707519531,38.18566131591797,0.7809883952140808,0.7879791259765625,0.8233129382133484,9703,9754,934,792,4508,4457,0,0,0,0,"tensor([346, 329, 282, 275, 279, 268, 260, 264, 193, 106, 22], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,40.66462707519531,40.66462707519531,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,8,40.66462707519531,1.352553367614746,0.0,0.3605870008468628,0.5454545617103577,0,86,0,6,385,299,0,0,0,0,"tensor([0, 1, 0, 1, 3, 1, 2, 1, 5, 1, 0], device='cuda:0')","tensor([0, 1, 0, 1, 3, 1, 2, 1, 5, 1, 0], device='cuda:0')",20000,18325,4,40.66462707519531,17.6801700592041,0.9587478041648864,0.9660379886627196,0.9567941427230836,18314,18233,1565,1190,11,92,0,0,0,0,"tensor([697, 629, 553, 539, 525, 507, 492, 447, 297, 138, 22], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,8,40.66462707519531,1.352553367614746,0.0,0.012620392255485,0.012620392255485,0,19,0,4,2988,2969,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,40.66462707519531,17.6801700592041,0.0,0.0421715155243873,0.0687519386410713,0,134,0,3,6218,6084,0,0,0,0,"tensor([0, 0, 0, 3, 4, 4, 3, 4, 5, 4, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 2,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_2/,autoencoders/matryoshka_chess/trainer_2/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,53.19999694824219,43.98674392700195,1.5716207027435305,0.157958984375,0.9753849506378174,0.9782140851020812,0.9860661625862122,0.2971398532390594,0.3101760149002075,3.4657371044158936,0.9958857893943788,4048,20000,1280000,3,68.12490844726562,28.005863189697266,0.583165168762207,0.676455557346344,0.7952182292938232,542229,669691,37378,30309,737771,610309,3965,13818,3930,13505,"tensor([14254, 14171, 13272, 13289, 13525, 14080, 14604, 14507, 11651, 6725, 1150], device='cuda:0')","tensor([ 36, 45, 104, 209, 260, 294, 300, 280, 186, 61, 7], device='cuda:0')",20000,578762,3,68.12490844726562,28.005863189697266,0.5656574964523315,0.7383513450622559,0.8383210897445679,234510,345781,15887,12087,344252,232981,163,1389,162,1357,"tensor([5663, 5822, 5554, 5569, 5700, 5913, 6124, 6199, 5188, 3208, 569], device='cuda:0')","tensor([ 34, 43, 100, 200, 251, 283, 289, 272, 180, 59, 7], device='cuda:0')",20000,221620,3,68.12490844726562,28.005863189697266,0.2101207673549652,0.7063115835189819,0.8228605389595032,26124,122443,913,2648,195496,99177,11,558,11,532,"tensor([151, 165, 253, 437, 564, 640, 701, 677, 498, 244, 40], device='cuda:0')","tensor([ 34, 40, 98, 197, 249, 281, 289, 272, 180, 59, 7], device='cuda:0')",20000,1280000,2,68.12490844726562,39.30157852172852,0.6508543491363525,0.7142592668533325,0.817118227481842,638233,730814,42983,35541,641767,549186,7123,17143,7087,17096,"tensor([15262, 15149, 14104, 14120, 14286, 14848, 15362, 15164, 12053, 6839, 1150], device='cuda:0')","tensor([ 58, 82, 146, 195, 195, 195, 179, 151, 97, 29, 0], device='cuda:0')",20000,1922,3,68.12490844726562,28.005863189697266,0.0487062372267246,0.1378977745771408,0.1945996284484863,48,143,1,9,1874,1779,0,0,0,0,"tensor([1, 1, 1, 2, 1, 1, 3, 4, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,68.12490844726562,28.005863189697266,0.8252145051956177,0.9006322026252747,0.9275830388069152,476268,554354,19783,18441,181970,103884,0,0,0,0,"tensor([24822, 22189, 19422, 18107, 17083, 16143, 15274, 13097, 8974, 3836, 512], device='cuda:0')","tensor([31, 31, 43, 56, 68, 70, 69, 71, 58, 11, 4], device='cuda:0')",20000,392,2,68.12490844726562,39.30157852172852,0.5754386186599731,0.984924614429474,0.9560975432395936,164,392,14,12,228,0,0,0,0,0,"tensor([13, 13, 24, 24, 19, 16, 16, 13, 8, 2, 0], device='cuda:0')","tensor([13, 13, 24, 24, 19, 16, 16, 13, 8, 2, 0], device='cuda:0')",20000,434590,4,68.12490844726562,19.86624336242676,0.4729049503803253,0.5413203239440918,0.6947263479232788,137460,164278,9293,8085,297130,270312,0,0,0,0,"tensor([3316, 3385, 3358, 3513, 3771, 4084, 4329, 4346, 3525, 2041, 334], device='cuda:0')","tensor([ 3, 4, 10, 20, 22, 25, 25, 24, 18, 5, 0], device='cuda:0')",20000,7,0,68.12490844726562,68.12490844726562,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,68.12490844726562,68.12490844726562,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,68.12490844726562,28.005863189697266,0.8776140213012695,0.9597877860069276,0.9311216473579408,8813,10132,729,439,1729,410,0,0,0,0,"tensor([231, 244, 231, 217, 208, 204, 201, 200, 174, 114, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,2,68.12490844726562,39.30157852172852,0.8152886629104614,0.8749170899391174,0.9209315180778505,7455,8572,535,725,2843,1726,0,0,0,0,"tensor([224, 236, 222, 208, 202, 199, 196, 193, 172, 112, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,68.12490844726562,28.005863189697266,0.856637716293335,0.9514228105545044,0.9262930154800416,8237,9930,669,619,2088,395,0,0,0,0,"tensor([230, 239, 229, 214, 207, 203, 200, 198, 174, 114, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,7,68.12490844726562,3.267620086669922,0.0,0.804347813129425,0.804347813129425,0,37,0,2,53,16,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0], device='cuda:0')",20000,443761,4,68.12490844726562,19.86624336242676,0.508462131023407,0.5773608684539795,0.7189186811447144,154843,183763,10460,9038,288918,259998,0,0,0,0,"tensor([3981, 3953, 3764, 3854, 4059, 4309, 4519, 4506, 3652, 2077, 334], device='cuda:0')","tensor([ 3, 3, 14, 26, 25, 31, 26, 24, 18, 5, 0], device='cuda:0')",20000,0,0,68.12490844726562,68.12490844726562,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,68.12490844726562,28.005863189697266,0.0558941587805748,0.1633510738611221,0.3343793153762817,188,583,12,28,6339,5944,0,0,0,0,"tensor([ 4, 4, 9, 8, 12, 17, 19, 23, 19, 20, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,2,68.12490844726562,39.30157852172852,0.7656397223472595,0.7732565402984619,0.8335815668106079,9332,9397,834,697,4879,4814,0,0,0,0,"tensor([341, 338, 301, 273, 261, 272, 270, 277, 224, 125, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,68.12490844726562,68.12490844726562,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,6,68.12490844726562,7.036682605743408,0.0,0.4462151229381561,0.5703970789909363,0,112,0,5,385,273,0,0,0,0,"tensor([0, 1, 1, 2, 1, 2, 3, 3, 5, 2, 0], device='cuda:0')","tensor([0, 1, 1, 2, 1, 2, 3, 3, 5, 2, 0], device='cuda:0')",20000,18325,4,68.12490844726562,19.86624336242676,0.9567511677742004,0.9639160633087158,0.9563198089599608,18317,18205,1648,1243,8,120,0,0,0,0,"tensor([704, 641, 576, 557, 543, 537, 515, 467, 328, 144, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,3,68.12490844726562,28.005863189697266,0.0,0.3322259187698364,0.3351739645004272,0,600,0,24,2988,2388,0,0,0,0,"tensor([0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,68.12490844726562,7.036682605743408,0.0,0.0480150654911994,0.0672659575939178,0,153,0,2,6218,6065,0,0,0,0,"tensor([0, 2, 0, 1, 2, 2, 5, 5, 6, 3, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 3,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_3/,autoencoders/matryoshka_chess/trainer_3/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,76.79999542236328,53.29953002929688,1.5074893236160278,0.173095703125,0.9771131873130798,0.9796521663665771,0.988621175289154,0.2971398532390594,0.3102563619613647,3.4657371044158936,0.995860517024994,4004,20000,1280000,3,93.26009368896484,29.69932746887207,0.579240620136261,0.6736525893211365,0.7950837016105652,535938,665205,34547,29715,744062,614795,3980,13445,3929,13228,"tensor([14760, 14899, 13795, 13164, 13358, 13551, 14252, 14255, 11384, 6602, 1129], device='cuda:0')","tensor([ 54, 59, 107, 198, 254, 278, 288, 282, 196, 61, 5], device='cuda:0')",20000,578762,3,93.26009368896484,29.69932746887207,0.5564415454864502,0.7379485368728638,0.8452486395835876,228333,345202,13595,11608,350429,233560,198,1269,198,1249,"tensor([5984, 6192, 5850, 5585, 5652, 5667, 6023, 6115, 5079, 3167, 562], device='cuda:0')","tensor([ 54, 58, 104, 193, 247, 268, 277, 271, 190, 57, 5], device='cuda:0')",20000,221620,4,93.26009368896484,20.01974296569824,0.1961953043937683,0.6788899302482605,0.8204678297042847,24190,114544,781,1281,197430,107076,10,324,10,322,"tensor([183, 201, 287, 453, 556, 612, 660, 652, 492, 257, 47], device='cuda:0')","tensor([ 54, 57, 103, 192, 246, 267, 277, 271, 190, 57, 5], device='cuda:0')",20000,1280000,2,93.26009368896484,44.04977798461914,0.6141149401664734,0.7252715229988098,0.8186386227607727,584159,749625,38283,37532,695841,530375,5780,17867,5765,17803,"tensor([15721, 15828, 14626, 13940, 14159, 14306, 14979, 14887, 11801, 6712, 1129], device='cuda:0')","tensor([ 65, 89, 149, 199, 204, 197, 187, 155, 91, 27, 0], device='cuda:0')",20000,1922,7,93.26009368896484,2.989930868148804,0.0,0.0515933223068714,0.0787244588136673,0,51,0,4,1922,1871,0,0,0,0,"tensor([0, 0, 0, 0, 0, 3, 3, 4, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,93.26009368896484,29.69932746887207,0.8132410645484924,0.8953076601028442,0.92041277885437,464246,548290,19234,18280,193992,109948,0,0,0,0,"tensor([25022, 22565, 19434, 17587, 16825, 15773, 14946, 13104, 8897, 3685, 492], device='cuda:0')","tensor([15, 17, 26, 42, 58, 78, 91, 73, 41, 8, 2], device='cuda:0')",20000,392,2,93.26009368896484,44.04977798461914,0.9285714626312256,0.9936628341674804,0.9631449580192566,351,392,13,5,41,0,0,0,0,0,"tensor([11, 13, 17, 17, 16, 13, 10, 10, 6, 0, 0], device='cuda:0')","tensor([11, 13, 17, 17, 16, 13, 10, 10, 6, 0, 0], device='cuda:0')",20000,434590,4,93.26009368896484,20.01974296569824,0.4818060994148254,0.534999430179596,0.6904559135437012,140724,161496,8838,7638,293866,273094,0,0,0,0,"tensor([3371, 3555, 3577, 3579, 3824, 3897, 4140, 4223, 3475, 2016, 346], device='cuda:0')","tensor([ 5, 6, 17, 23, 26, 23, 26, 22, 19, 6, 0], device='cuda:0')",20000,7,0,93.26009368896484,93.26009368896484,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,93.26009368896484,93.26009368896484,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,93.26009368896484,29.69932746887207,0.8741661310195923,0.96637624502182,0.9368566274642944,8649,10203,597,371,1893,339,0,0,0,0,"tensor([254, 253, 232, 209, 203, 192, 203, 208, 165, 105, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,93.26009368896484,68.59728240966797,0.8707680106163025,0.8861027956008911,0.911554992198944,8436,8764,642,719,1862,1534,0,0,0,0,"tensor([242, 241, 227, 204, 198, 184, 199, 200, 162, 105, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,93.26009368896484,29.69932746887207,0.8475366830825806,0.957950234413147,0.9288612604141236,7991,10001,541,554,2334,324,0,0,0,0,"tensor([250, 251, 230, 207, 202, 191, 202, 205, 164, 105, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,93.26009368896484,6.457205295562744,0.0,0.7835051417350769,0.8316831588745117,0,38,0,6,53,15,0,0,0,0,"tensor([0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,93.26009368896484,29.69932746887207,0.5105890035629272,0.5576387047767639,0.7111286520957947,155518,175057,9892,9033,288243,268704,0,0,0,0,"tensor([4056, 4128, 3986, 3886, 4077, 4141, 4326, 4405, 3572, 2039, 346], device='cuda:0')","tensor([ 8, 9, 23, 23, 28, 24, 26, 22, 19, 6, 0], device='cuda:0')",20000,0,0,93.26009368896484,93.26009368896484,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,2,93.26009368896484,44.04977798461914,0.172571912407875,0.1953360587358474,0.3220746219158172,621,712,49,51,5906,5815,0,0,0,0,"tensor([ 7, 9, 10, 11, 13, 13, 11, 13, 15, 15, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,0,93.26009368896484,93.26009368896484,0.7814031839370728,0.7814031839370728,0.8225396871566772,9807,9807,1083,1083,4404,4404,0,0,0,0,"tensor([360, 354, 308, 267, 265, 254, 263, 269, 216, 114, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,93.26009368896484,93.26009368896484,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,7,93.26009368896484,2.989930868148804,0.0648379027843475,0.3716075420379638,0.5510948896408081,13,89,3,5,372,296,0,0,0,0,"tensor([1, 1, 1, 2, 1, 4, 4, 2, 2, 2, 0], device='cuda:0')","tensor([1, 1, 1, 2, 1, 4, 4, 2, 2, 2, 0], device='cuda:0')",20000,18325,4,93.26009368896484,20.01974296569824,0.9564876556396484,0.9623576402664183,0.9562948346138,18322,18254,1664,1357,3,71,0,0,0,0,"tensor([699, 656, 560, 535, 531, 526, 511, 477, 338, 140, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,3,93.26009368896484,29.69932746887207,0.0,0.2840135991573334,0.2840135991573334,0,501,0,39,2988,2487,0,0,0,0,"tensor([0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,8,93.26009368896484,1.2228978872299194,0.0,0.0244483258575201,0.049522016197443,0,77,0,4,6218,6141,0,0,0,0,"tensor([0, 0, 0, 1, 1, 2, 2, 2, 4, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 4,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_4/,autoencoders/matryoshka_chess/trainer_4/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,96.95999908447266,59.37613677978516,1.4183404445648191,0.183837890625,0.9799119830131532,0.9818909764289856,0.9926769733428956,0.2971398532390594,0.3061265051364898,3.4657371044158936,0.9971638321876526,3872,20000,1280000,3,119.78266143798828,31.373136520385746,0.5676613450050354,0.6465390920639038,0.7789537310600281,519025,625193,29618,28775,760975,654807,3960,11622,3915,11406,"tensor([12559, 13238, 12727, 12619, 12775, 12788, 13463, 12700, 10192, 6190, 1598], device='cuda:0')","tensor([ 46, 52, 94, 175, 235, 257, 256, 228, 164, 58, 5], device='cuda:0')",20000,578762,4,119.78266143798828,20.28169631958008,0.5450129508972168,0.6938215494155884,0.81992506980896,220915,312432,11001,9418,357847,266330,232,917,216,898,"tensor([5171, 5499, 5361, 5326, 5499, 5451, 5701, 5460, 4511, 2939, 795], device='cuda:0')","tensor([ 42, 48, 88, 168, 229, 246, 247, 221, 160, 54, 4], device='cuda:0')",20000,221620,4,119.78266143798828,20.28169631958008,0.203637033700943,0.6494051814079285,0.7951791882514954,25229,107297,935,1530,196391,114323,21,381,21,375,"tensor([195, 208, 291, 439, 555, 598, 637, 572, 451, 252, 71], device='cuda:0')","tensor([ 42, 45, 87, 167, 227, 244, 247, 221, 160, 54, 4], device='cuda:0')",20000,1280000,3,119.78266143798828,31.373136520385746,0.5960858464241028,0.7002143859863281,0.808163583278656,557250,706266,32447,31019,722750,573734,4930,15216,4922,15186,"tensor([13308, 14019, 13450, 13317, 13426, 13431, 14119, 13257, 10564, 6278, 1598], device='cuda:0')","tensor([ 59, 71, 133, 164, 166, 168, 157, 121, 85, 24, 1], device='cuda:0')",20000,1922,7,119.78266143798828,3.046278476715088,0.0,0.0397756285965442,0.0701051577925682,0,39,0,0,1922,1883,0,0,0,0,"tensor([0, 0, 1, 1, 1, 1, 3, 3, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,119.78266143798828,31.373136520385746,0.7313641309738159,0.8877383470535278,0.8650382161140442,389089,539839,16682,18135,269149,118399,0,0,0,0,"tensor([21981, 20599, 18121, 16611, 15525, 14686, 13931, 11648, 8090, 3578, 711], device='cuda:0')","tensor([34, 34, 48, 58, 66, 64, 83, 66, 43, 9, 2], device='cuda:0')",20000,392,3,119.78266143798828,31.373136520385746,0.7588325142860413,0.9897436499595642,0.9300118684768676,247,386,12,2,145,6,0,0,0,0,"tensor([ 7, 7, 11, 13, 13, 14, 12, 12, 7, 2, 0], device='cuda:0')","tensor([ 7, 7, 11, 13, 13, 14, 12, 12, 7, 2, 0], device='cuda:0')",20000,434590,4,119.78266143798828,20.28169631958008,0.4881059229373932,0.5292680263519287,0.6776451468467712,142852,159139,7890,7626,291738,275451,0,0,0,0,"tensor([3138, 3315, 3338, 3446, 3678, 3754, 4004, 3811, 3105, 1876, 479], device='cuda:0')","tensor([ 9, 9, 18, 24, 24, 24, 20, 19, 13, 6, 0], device='cuda:0')",20000,7,0,119.78266143798828,119.78266143798828,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,119.78266143798828,119.78266143798828,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,119.78266143798828,31.373136520385746,0.8483263850212097,0.9620217084884644,0.9397655129432678,8110,10183,468,445,2432,359,0,0,0,0,"tensor([210, 217, 208, 197, 193, 178, 185, 182, 144, 94, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,119.78266143798828,12.469648361206056,0.809918224811554,0.8404179811477661,0.9139919877052308,7333,7681,477,300,2965,2617,0,0,0,0,"tensor([204, 209, 201, 191, 187, 172, 178, 181, 141, 94, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,119.78266143798828,31.373136520385746,0.8171935677528381,0.9534906148910522,0.933752179145813,7405,9984,393,633,2920,341,0,0,0,0,"tensor([209, 214, 206, 196, 193, 178, 184, 182, 144, 94, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,119.78266143798828,7.116698741912842,0.0,0.8282828330993652,0.8282828330993652,0,41,0,5,53,12,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,119.78266143798828,31.373136520385746,0.508215069770813,0.5525027513504028,0.6984900832176208,154195,172756,8854,8841,289566,271005,0,0,0,0,"tensor([3519, 3740, 3681, 3730, 3900, 3955, 4198, 3938, 3189, 1906, 479], device='cuda:0')","tensor([11, 11, 19, 24, 24, 27, 23, 19, 13, 6, 0], device='cuda:0')",20000,0,0,119.78266143798828,119.78266143798828,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,6,119.78266143798828,7.116698741912842,0.0348714850842952,0.1447592079639434,0.2581155896186828,116,511,10,22,6411,6016,0,0,0,0,"tensor([ 5, 4, 12, 14, 13, 16, 15, 19, 18, 18, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,119.78266143798828,82.27289581298828,0.7277688980102539,0.7439023852348328,0.8142390847206116,8401,8723,475,518,5810,5488,0,0,0,0,"tensor([274, 284, 262, 245, 248, 244, 242, 230, 195, 108, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,119.78266143798828,119.78266143798828,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,7,119.78266143798828,3.046278476715088,0.0,0.3747368454933166,0.4715127944946289,0,89,0,1,385,296,0,0,0,0,"tensor([0, 0, 0, 1, 1, 2, 1, 3, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 1, 1, 2, 1, 3, 2, 0, 0], device='cuda:0')",20000,18325,4,119.78266143798828,20.28169631958008,0.9576772451400756,0.9614313840866088,0.9563198089599608,18306,18297,1599,1440,19,28,0,0,0,0,"tensor([547, 565, 524, 517, 488, 468, 473, 421, 299, 136, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,6,119.78266143798828,7.116698741912842,0.0,0.0172413792461156,0.0172413792461156,0,26,0,2,2988,2962,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,119.78266143798828,7.116698741912842,0.0,0.039666298776865,0.0679069757461547,0,126,0,9,6218,6092,0,0,0,0,"tensor([0, 0, 1, 2, 2, 2, 4, 5, 3, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 5,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_5/,autoencoders/matryoshka_chess/trainer_5/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,118.27999877929688,67.23790740966797,1.361075758934021,0.1796875,0.9817731380462646,0.9840524196624756,0.9943403601646424,0.2971398532390594,0.3061086535453796,3.4657371044158936,0.9971694350242616,3636,20000,1280000,3,145.4110870361328,32.286842346191406,0.531870424747467,0.6225016117095947,0.7555956840515137,472123,590726,23208,27184,807877,689274,2433,7624,2415,7492,"tensor([10442, 11398, 11048, 11504, 11175, 11366, 12287, 11462, 9513, 5117, 1152], device='cuda:0')","tensor([ 55, 54, 85, 163, 207, 237, 248, 224, 152, 49, 4], device='cuda:0')",20000,578762,3,145.4110870361328,32.286842346191406,0.5013353824615479,0.6720630526542664,0.7983182668685913,196252,298479,7903,11006,382510,280283,183,777,181,740,"tensor([4372, 4767, 4685, 4882, 4694, 4715, 5111, 4877, 4231, 2438, 576], device='cuda:0')","tensor([ 54, 53, 83, 159, 203, 229, 240, 216, 147, 48, 4], device='cuda:0')",20000,221620,4,145.4110870361328,19.53734397888184,0.1638856083154678,0.588313102722168,0.7474048137664795,19864,92947,929,1411,201756,128673,42,354,42,351,"tensor([209, 210, 273, 412, 497, 551, 601, 537, 427, 216, 48], device='cuda:0')","tensor([ 54, 53, 82, 157, 202, 228, 240, 216, 147, 48, 4], device='cuda:0')",20000,1280000,3,145.4110870361328,32.286842346191406,0.5614351034164429,0.6721416115760803,0.7890010476112366,509440,662402,25338,28617,770560,617598,3782,12228,3779,12207,"tensor([11058, 12071, 11661, 12133, 11770, 12004, 12903, 11994, 9859, 5200, 1152], device='cuda:0')","tensor([ 55, 71, 107, 150, 158, 154, 147, 119, 66, 16, 0], device='cuda:0')",20000,1922,4,145.4110870361328,19.53734397888184,0.0,0.0700700655579567,0.1525261998176574,0,70,0,6,1922,1852,0,0,0,0,"tensor([0, 0, 0, 1, 2, 2, 3, 3, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,2,145.4110870361328,54.60490036010742,0.6161924600601196,0.8662944436073303,0.773444652557373,299370,517465,14069,18960,358868,140773,0,0,0,0,"tensor([19475, 18748, 16819, 15891, 14656, 13815, 12872, 10738, 7170, 2900, 499], device='cuda:0')","tensor([26, 28, 31, 45, 57, 73, 71, 63, 36, 7, 0], device='cuda:0')",20000,392,3,145.4110870361328,32.286842346191406,0.9020689725875854,0.996178388595581,0.9861635565757751,327,391,6,2,65,1,0,0,0,0,"tensor([ 8, 9, 10, 11, 10, 10, 8, 8, 3, 3, 0], device='cuda:0')","tensor([ 8, 9, 10, 11, 10, 10, 8, 8, 3, 3, 0], device='cuda:0')",20000,434590,4,145.4110870361328,19.53734397888184,0.4588482677936554,0.5080815553665161,0.6548886895179749,131268,150431,6305,7132,303322,284159,0,0,0,0,"tensor([2784, 2924, 3022, 3247, 3242, 3360, 3664, 3486, 2969, 1556, 345], device='cuda:0')","tensor([ 4, 4, 11, 16, 19, 16, 17, 17, 12, 1, 0], device='cuda:0')",20000,7,0,145.4110870361328,145.4110870361328,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,145.4110870361328,145.4110870361328,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,145.4110870361328,32.286842346191406,0.8208450675010681,0.9605659246444702,0.9402523040771484,7537,10048,285,331,3005,494,0,0,0,0,"tensor([178, 196, 175, 175, 164, 155, 161, 156, 138, 81, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,145.4110870361328,11.38952922821045,0.7903760075569153,0.812870442867279,0.9039525985717772,6915,7200,285,217,3383,3098,0,0,0,0,"tensor([173, 191, 169, 169, 157, 150, 155, 150, 135, 80, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,145.4110870361328,32.286842346191406,0.7941929697990417,0.9534084796905518,0.9324072599411012,6975,9853,265,491,3350,472,0,0,0,0,"tensor([176, 193, 173, 171, 162, 152, 159, 155, 137, 81, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,7,145.4110870361328,2.6133244037628174,0.0,0.6511628031730652,0.6511628031730652,0,28,0,5,53,25,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')",20000,443761,4,145.4110870361328,19.53734397888184,0.4830166399478912,0.5224257111549377,0.6717514395713806,143689,159530,7515,7437,300072,284231,0,0,0,0,"tensor([2998, 3258, 3284, 3504, 3469, 3560, 3862, 3618, 3036, 1598, 345], device='cuda:0')","tensor([ 5, 5, 15, 20, 18, 15, 17, 17, 12, 1, 0], device='cuda:0')",20000,0,0,145.4110870361328,145.4110870361328,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,145.4110870361328,19.53734397888184,0.0934769958257675,0.148514837026596,0.2858626544475555,321,525,20,18,6206,6002,0,0,0,0,"tensor([ 8, 7, 6, 9, 13, 14, 19, 21, 17, 18, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,145.4110870361328,96.36578369140624,0.7179486751556396,0.742553174495697,0.8169540762901306,8162,8725,364,564,6049,5486,0,0,0,0,"tensor([225, 246, 230, 231, 209, 206, 215, 213, 179, 93, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,145.4110870361328,145.4110870361328,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,145.4110870361328,54.60490036010742,0.0,0.402414470911026,0.5605786442756653,0,100,0,12,385,285,0,0,0,0,"tensor([0, 0, 2, 1, 1, 3, 3, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 2, 1, 1, 3, 3, 1, 1, 1, 0], device='cuda:0')",20000,18325,3,145.4110870361328,32.286842346191406,0.9575552344322203,0.9593260884284972,0.9563198089599608,18127,18279,1409,1504,198,46,0,0,0,0,"tensor([432, 480, 452, 456, 446, 444, 434, 392, 273, 108, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,145.4110870361328,145.4110870361328,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,7,145.4110870361328,2.6133244037628174,0.0,0.0400315225124359,0.0700992569327354,0,127,0,0,6218,6091,0,0,0,0,"tensor([0, 0, 1, 3, 3, 4, 5, 5, 4, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 6,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_6/,autoencoders/matryoshka_chess/trainer_6/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,140.1999969482422,78.34004211425781,1.2821279764175415,0.1787109375,0.9835570454597472,0.9856407046318054,0.9945541024208068,0.2971398532390594,0.3041818737983703,3.4657371044158936,0.9977775812149048,3355,20000,1280000,3,170.7425537109375,35.74299240112305,0.5114122033119202,0.6029230356216431,0.7391892075538635,446526,562633,19721,23718,833474,717367,2822,7489,2793,7369,"tensor([ 9202, 10563, 10142, 10541, 10816, 11358, 11694, 10891, 8726, 5242, 1088], device='cuda:0')","tensor([ 58, 60, 83, 134, 162, 194, 197, 170, 116, 42, 6], device='cuda:0')",20000,578762,3,170.7425537109375,35.74299240112305,0.4803441166877746,0.6498228311538696,0.776003897190094,184914,283043,6247,9334,393848,295719,191,637,181,632,"tensor([3906, 4448, 4327, 4591, 4668, 4826, 4976, 4742, 3939, 2527, 544], device='cuda:0')","tensor([ 56, 58, 81, 129, 155, 183, 187, 160, 111, 38, 3], device='cuda:0')",20000,221620,3,170.7425537109375,35.74299240112305,0.1788605898618698,0.5407550930976868,0.709592342376709,21848,82828,834,1894,199772,138792,13,389,13,388,"tensor([225, 235, 276, 388, 451, 507, 532, 464, 368, 206, 42], device='cuda:0')","tensor([ 56, 57, 79, 128, 154, 182, 187, 160, 111, 38, 3], device='cuda:0')",20000,1280000,3,170.7425537109375,35.74299240112305,0.5347838997840881,0.6540360450744629,0.7723010182380676,474959,634482,21306,25723,805041,645518,3383,11134,3376,11101,"tensor([ 9727, 11160, 10689, 11038, 11340, 11871, 12237, 11334, 9013, 5301, 1088], device='cuda:0')","tensor([ 56, 65, 94, 118, 122, 127, 122, 99, 58, 15, 3], device='cuda:0')",20000,1922,3,170.7425537109375,35.74299240112305,0.0,0.0882061421871185,0.1341698765754699,0,89,0,7,1922,1833,0,0,0,0,"tensor([0, 0, 0, 1, 0, 2, 2, 2, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,170.7425537109375,35.74299240112305,0.5138603448867798,0.867509126663208,0.703855037689209,231704,518050,11875,18051,426534,140188,0,0,0,0,"tensor([17293, 17028, 15104, 14175, 13457, 12738, 11672, 9198, 6172, 2798, 459], device='cuda:0')","tensor([40, 38, 42, 42, 50, 58, 50, 43, 25, 5, 0], device='cuda:0')",20000,392,3,170.7425537109375,35.74299240112305,0.7796609997749329,0.9936467409133912,0.9836477637290956,253,391,4,4,139,1,0,0,0,0,"tensor([8, 8, 8, 9, 8, 9, 7, 7, 4, 1, 0], device='cuda:0')","tensor([8, 8, 8, 9, 8, 9, 7, 7, 4, 1, 0], device='cuda:0')",20000,434590,5,170.7425537109375,11.38751983642578,0.4427096545696258,0.4872436821460724,0.6307920217514038,125187,141909,5772,5998,309403,292681,0,0,0,0,"tensor([2588, 2863, 2773, 3023, 3252, 3440, 3528, 3313, 2646, 1598, 320], device='cuda:0')","tensor([ 7, 7, 7, 18, 19, 18, 17, 14, 9, 5, 0], device='cuda:0')",20000,7,0,170.7425537109375,170.7425537109375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,170.7425537109375,170.7425537109375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,170.7425537109375,20.43633270263672,0.7254564166069031,0.94851553440094,0.941234827041626,6100,9792,175,313,4442,750,0,0,0,0,"tensor([153, 171, 162, 163, 161, 157, 150, 152, 126, 81, 17], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,170.7425537109375,11.38751983642578,0.6806468367576599,0.8562621474266052,0.8990974426269531,5388,7917,146,277,4910,2381,0,0,0,0,"tensor([147, 164, 156, 160, 157, 153, 145, 149, 124, 80, 17], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,170.7425537109375,20.43633270263672,0.734337329864502,0.9445912837982178,0.932847023010254,6095,9649,180,456,4230,676,0,0,0,0,"tensor([153, 171, 162, 163, 161, 156, 150, 152, 126, 80, 17], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,170.7425537109375,6.027648448944092,0.0,0.6511628031730652,0.6511628031730652,0,28,0,5,53,25,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,170.7425537109375,35.74299240112305,0.4623453617095947,0.496218204498291,0.646458625793457,135485,148662,6831,6757,308276,295099,0,0,0,0,"tensor([2727, 3120, 3025, 3225, 3396, 3624, 3731, 3436, 2701, 1630, 320], device='cuda:0')","tensor([ 6, 6, 6, 17, 18, 17, 17, 15, 9, 5, 0], device='cuda:0')",20000,0,0,170.7425537109375,170.7425537109375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,170.7425537109375,20.43633270263672,0.0381266921758651,0.146659106016159,0.237197458744049,127,518,8,19,6400,6009,0,0,0,0,"tensor([ 4, 4, 4, 9, 15, 19, 18, 20, 15, 14, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,5,170.7425537109375,11.38751983642578,0.666881263256073,0.7338740825653076,0.8063177466392517,7252,8550,286,540,6959,5661,0,0,0,0,"tensor([193, 220, 205, 208, 205, 206, 209, 200, 159, 89, 17], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,170.7425537109375,170.7425537109375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,170.7425537109375,11.38751983642578,0.0,0.2258064448833465,0.3815513849258423,0,49,0,0,385,336,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 1, 2, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 1, 2, 1, 0, 0], device='cuda:0')",20000,18325,3,170.7425537109375,35.74299240112305,0.956872820854187,0.9591462016105652,0.9563198089599608,18127,18289,1436,1522,198,36,0,0,0,0,"tensor([375, 436, 403, 400, 405, 418, 411, 339, 228, 109, 17], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,8,170.7425537109375,0.97568941116333,0.0,0.0079840319231152,0.0079840319231152,0,12,0,6,2988,2976,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,7,170.7425537109375,2.5184152126312256,0.0203691907227039,0.0443187169730663,0.0673181265592575,64,141,2,4,6154,6077,0,0,0,0,"tensor([2, 2, 1, 2, 3, 4, 5, 8, 5, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 7,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_7/,autoencoders/matryoshka_chess/trainer_7/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,162.67999267578125,91.28782653808594,1.2322967052459717,0.17919921875,0.9852133989334106,0.9871873259544371,0.9962756037712096,0.2971398532390594,0.3002977073192596,3.4657371044158936,0.9990034103393556,3027,20000,1280000,3,197.6445159912109,36.49449920654297,0.4830027222633362,0.5555539131164551,0.7109944224357605,412622,500178,15948,20468,867378,779822,2204,4587,2191,4518,"tensor([ 8789, 10008, 9924, 9443, 9193, 9605, 10221, 9672, 7833, 4602, 960], device='cuda:0')","tensor([ 52, 53, 70, 104, 129, 147, 160, 156, 109, 42, 4], device='cuda:0')",20000,578762,4,197.6445159912109,19.995819091796875,0.4485375583171844,0.5701121687889099,0.7397025227546692,168732,232990,4871,5596,410030,345772,36,282,35,281,"tensor([3915, 4369, 4398, 4146, 3968, 4105, 4329, 4229, 3602, 2222, 480], device='cuda:0')","tensor([ 48, 49, 66, 99, 122, 137, 149, 147, 101, 36, 3], device='cuda:0')",20000,221620,4,197.6445159912109,19.995819091796875,0.1273237019777298,0.5040509700775146,0.6698627471923828,15106,74905,559,687,206514,146715,18,113,18,113,"tensor([241, 248, 278, 333, 363, 402, 420, 407, 335, 186, 38], device='cuda:0')","tensor([ 48, 49, 66, 98, 122, 136, 148, 147, 101, 36, 3], device='cuda:0')",20000,1280000,3,197.6445159912109,36.49449920654297,0.5038016438484192,0.612258791923523,0.7494068741798401,436795,574468,17201,22085,843205,705532,2768,7909,2768,7895,"tensor([ 9164, 10473, 10329, 9824, 9600, 10036, 10716, 10075, 8058, 4653, 960], device='cuda:0')","tensor([ 64, 68, 95, 101, 101, 98, 100, 87, 50, 20, 1], device='cuda:0')",20000,1922,6,197.6445159912109,5.190147399902344,0.0407124683260917,0.0427698567509651,0.0864811092615127,40,42,3,0,1882,1880,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 2, 3, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,197.6445159912109,36.49449920654297,0.4653086960315704,0.8565294146537781,0.6596480011940002,202621,505289,10051,16325,455617,152949,0,0,0,0,"tensor([16066, 15836, 14106, 12967, 11971, 11337, 10414, 8373, 5489, 2448, 413], device='cuda:0')","tensor([48, 48, 48, 44, 43, 46, 33, 34, 21, 10, 0], device='cuda:0')",20000,392,3,197.6445159912109,36.49449920654297,0.5290806889533997,0.9936628341674804,0.991150438785553,141,392,0,5,251,0,0,0,0,0,"tensor([2, 2, 4, 5, 6, 6, 6, 5, 3, 1, 0], device='cuda:0')","tensor([2, 2, 4, 5, 6, 6, 6, 5, 3, 1, 0], device='cuda:0')",20000,434590,5,197.6445159912109,10.44697380065918,0.4245060980319977,0.4637273252010345,0.6121844053268433,118271,132687,4356,4986,316319,301903,0,0,0,0,"tensor([2492, 2710, 2802, 2721, 2701, 2806, 3034, 2875, 2364, 1403, 286], device='cuda:0')","tensor([ 9, 9, 10, 14, 14, 13, 14, 12, 12, 6, 0], device='cuda:0')",20000,7,0,197.6445159912109,197.6445159912109,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,197.6445159912109,197.6445159912109,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,197.6445159912109,125.7876434326172,0.7092848420143127,0.7890572547912598,0.8500100374221802,5886,7081,169,325,4656,3461,0,0,0,0,"tensor([151, 165, 166, 147, 140, 137, 138, 143, 113, 73, 15], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,197.6445159912109,125.7876434326172,0.7028232216835022,0.7917801737785339,0.8403651118278503,5676,6974,178,344,4622,3324,0,0,0,0,"tensor([148, 161, 162, 143, 134, 133, 136, 140, 112, 73, 15], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,197.6445159912109,125.7876434326172,0.7182367444038391,0.7969542741775513,0.8539807200431824,5882,7065,172,340,4443,3260,0,0,0,0,"tensor([150, 164, 166, 147, 140, 137, 137, 142, 113, 73, 15], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,8,197.6445159912109,0.6787927746772766,0.0,0.34375,0.34375,0,11,0,0,53,42,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')",20000,443761,3,197.6445159912109,36.49449920654297,0.4445259571075439,0.4751951992511749,0.627617597579956,128392,140323,5505,6507,315369,303438,0,0,0,0,"tensor([2589, 2929, 2972, 2890, 2869, 3018, 3233, 3005, 2420, 1421, 286], device='cuda:0')","tensor([ 9, 9, 10, 13, 13, 13, 14, 12, 12, 6, 0], device='cuda:0')",20000,0,0,197.6445159912109,197.6445159912109,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,6,197.6445159912109,5.190147399902344,0.0227135065943002,0.1151016876101493,0.1783881187438964,75,399,2,7,6452,6128,0,0,0,0,"tensor([ 2, 2, 3, 6, 9, 11, 14, 18, 16, 12, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,197.6445159912109,125.7876434326172,0.6348770260810852,0.7256349325180054,0.8143349289894104,6697,8458,189,643,7514,5753,0,0,0,0,"tensor([181, 207, 195, 178, 160, 173, 176, 176, 143, 83, 15], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,197.6445159912109,197.6445159912109,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,7,197.6445159912109,2.158414363861084,0.0,0.0886699482798576,0.1431980729103088,0,18,0,3,385,367,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0], device='cuda:0')",20000,18325,4,197.6445159912109,19.995819091796875,0.9447420835494996,0.9598081707954408,0.9563447833061218,17456,18209,1173,1409,869,116,0,0,0,0,"tensor([311, 375, 342, 334, 322, 342, 354, 308, 209, 93, 15], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,197.6445159912109,197.6445159912109,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,197.6445159912109,5.190147399902344,0.0092696174979209,0.0297798197716474,0.0540202967822551,29,94,10,1,6189,6124,0,0,0,0,"tensor([3, 3, 2, 3, 2, 2, 4, 3, 3, 3, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 8,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_8/,autoencoders/matryoshka_chess/trainer_8/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,185.87998962402344,105.26849365234376,1.1523008346557615,0.17431640625,0.9871097207069396,0.9890608191490172,0.9960524439811708,0.2971398532390594,0.2991375625133514,3.4657371044158936,0.999369502067566,2707,20000,1280000,3,223.5609893798828,38.76810073852539,0.4460926055908203,0.5101774334907532,0.6681070327758789,371081,444863,12614,19091,908919,835137,1570,3305,1559,3276,"tensor([7408, 8875, 8558, 8253, 8721, 8913, 9574, 8788, 6795, 4294, 1723], device='cuda:0')","tensor([ 52, 54, 64, 81, 111, 126, 137, 117, 88, 29, 5], device='cuda:0')",20000,578762,3,223.5609893798828,38.76810073852539,0.4120175540447235,0.5080770254135132,0.6779736876487732,151106,199517,3625,7102,427656,379245,49,203,49,203,"tensor([3301, 3845, 3799, 3630, 3810, 3777, 4081, 3798, 3113, 2089, 857], device='cuda:0')","tensor([ 48, 50, 58, 77, 106, 121, 132, 113, 83, 25, 2], device='cuda:0')",20000,221620,4,223.5609893798828,19.240917205810547,0.1023692414164543,0.326817125082016,0.5239232778549194,11975,43392,362,531,209645,178228,16,70,16,70,"tensor([203, 209, 238, 289, 346, 380, 412, 354, 298, 178, 65], device='cuda:0')","tensor([ 48, 50, 57, 76, 106, 121, 132, 113, 83, 25, 2], device='cuda:0')",20000,1280000,2,223.5609893798828,76.95247650146484,0.4646422863006592,0.5631247162818909,0.7080466151237488,391505,510537,13684,22692,888495,769463,1849,5902,1848,5886,"tensor([7708, 9265, 8900, 8567, 9066, 9288, 9955, 9156, 7008, 4340, 1723], device='cuda:0')","tensor([50, 53, 72, 79, 91, 95, 90, 69, 38, 12, 3], device='cuda:0')",20000,1922,3,223.5609893798828,38.76810073852539,0.0,0.0407539494335651,0.0807980149984359,0,40,0,1,1922,1882,0,0,0,0,"tensor([0, 0, 0, 2, 2, 3, 2, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,223.5609893798828,19.240917205810547,0.4766153395175934,0.8130623698234558,0.6381998658180237,208829,461406,9233,15339,449409,196832,0,0,0,0,"tensor([14646, 14605, 12965, 11855, 11477, 10792, 9809, 7613, 4712, 2182, 745], device='cuda:0')","tensor([38, 24, 27, 29, 21, 21, 32, 26, 17, 4, 2], device='cuda:0')",20000,392,3,223.5609893798828,38.76810073852539,0.0,0.9949109554290771,0.9911280274391174,0,391,0,3,392,1,0,0,0,0,"tensor([0, 0, 0, 3, 3, 3, 3, 4, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 3, 3, 3, 3, 4, 2, 1, 0], device='cuda:0')",20000,434590,2,223.5609893798828,76.95247650146484,0.3853504359722137,0.4265465140342712,0.5698450207710266,104487,119317,3219,5549,330103,315273,0,0,0,0,"tensor([2140, 2383, 2437, 2411, 2627, 2633, 2853, 2624, 2113, 1309, 512], device='cuda:0')","tensor([ 6, 6, 7, 7, 9, 9, 9, 10, 11, 2, 0], device='cuda:0')",20000,7,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,223.5609893798828,19.240917205810547,0.6521053314208984,0.8367875814437866,0.8814207315444946,5165,7752,134,234,5377,2790,0,0,0,0,"tensor([123, 140, 135, 125, 135, 125, 133, 116, 99, 67, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,223.5609893798828,38.76810073852539,0.6551768779754639,0.6792147159576416,0.7630305290222168,5075,5449,119,298,5223,4849,0,0,0,0,"tensor([121, 136, 134, 124, 131, 122, 128, 110, 95, 65, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,223.5609893798828,19.240917205810547,0.661162257194519,0.8213256597518921,0.8759284019470215,5165,7410,134,309,5160,2915,0,0,0,0,"tensor([123, 140, 135, 124, 133, 124, 132, 116, 99, 67, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,223.5609893798828,76.95247650146484,0.4044106006622314,0.4562824368476867,0.5851842164993286,113568,133122,4318,6624,330193,310639,0,0,0,0,"tensor([2194, 2578, 2567, 2563, 2777, 2810, 3014, 2758, 2146, 1316, 512], device='cuda:0')","tensor([ 5, 5, 6, 6, 9, 9, 9, 10, 11, 2, 0], device='cuda:0')",20000,0,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,223.5609893798828,19.240917205810547,0.0848821848630905,0.1341132819652557,0.1913809776306152,290,470,16,12,6237,6057,0,0,0,0,"tensor([ 6, 6, 11, 14, 19, 20, 19, 15, 17, 14, 3], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,223.5609893798828,144.88111877441406,0.6221328973770142,0.7252975702285767,0.7793624997138977,6496,8379,176,515,7715,5832,0,0,0,0,"tensor([151, 177, 160, 154, 160, 157, 164, 147, 120, 74, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,223.5609893798828,9.294130325317385,0.0,0.1034482792019844,0.1034482792019844,0,21,0,0,385,364,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,223.5609893798828,76.95247650146484,0.9517622590065002,0.957761287689209,0.9564446210861206,17580,18242,1037,1526,745,83,0,0,0,0,"tensor([255, 317, 293, 282, 307, 326, 325, 283, 181, 86, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,223.5609893798828,223.5609893798828,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,3,223.5609893798828,38.76810073852539,0.0,0.0263450257480144,0.0362890549004077,0,83,0,0,6218,6135,0,0,0,0,"tensor([0, 0, 1, 2, 2, 2, 2, 3, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 9,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_9/,autoencoders/matryoshka_chess/trainer_9/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,206.3600006103516,124.09390258789062,1.077316164970398,0.165283203125,0.9887999296188354,0.9906377196311952,0.997454822063446,0.2971398532390594,0.3011258244514465,3.4657371044158936,0.9987420439720154,2422,20000,1280000,4,250.6846160888672,17.086719512939453,0.4175767004489898,0.4842879176139831,0.6405662298202515,340476,414288,10247,16628,939524,865712,1018,2877,1014,2824,"tensor([6989, 8031, 7741, 6988, 7174, 7833, 8021, 7005, 5623, 4114, 1231], device='cuda:0')","tensor([36, 39, 42, 61, 82, 94, 94, 82, 52, 24, 3], device='cuda:0')",20000,578762,4,250.6846160888672,17.086719512939453,0.3833200335502624,0.4679640829563141,0.6427057385444641,137876,178310,2740,4995,440886,400452,40,197,39,197,"tensor([3206, 3565, 3558, 3120, 3083, 3246, 3325, 3097, 2631, 2015, 614], device='cuda:0')","tensor([35, 38, 41, 57, 77, 88, 87, 77, 47, 20, 3], device='cuda:0')",20000,221620,4,250.6846160888672,17.086719512939453,0.0714291930198669,0.2798604965209961,0.4681375920772552,8218,36150,264,573,213402,185470,1,113,1,113,"tensor([199, 201, 213, 232, 278, 281, 286, 262, 215, 152, 48], device='cuda:0')","tensor([35, 38, 41, 57, 76, 87, 87, 77, 47, 20, 3], device='cuda:0')",20000,1280000,3,250.6846160888672,37.94621276855469,0.4335006177425384,0.5201236009597778,0.6796300411224365,357312,455680,11184,16519,922688,824320,1047,3517,1046,3516,"tensor([7204, 8321, 7986, 7230, 7450, 8206, 8375, 7261, 5730, 4138, 1233], device='cuda:0')","tensor([34, 38, 52, 61, 65, 65, 61, 50, 24, 8, 0], device='cuda:0')",20000,1922,6,250.6846160888672,2.932861566543579,0.0,0.035732515156269,0.0426829271018505,0,35,0,2,1922,1887,0,0,0,0,"tensor([0, 0, 0, 1, 1, 1, 2, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,250.6846160888672,37.94621276855469,0.5317820310592651,0.8037412166595459,0.6830700635910034,241721,452655,9139,15477,416517,205583,0,0,0,0,"tensor([13180, 13126, 11382, 10474, 10148, 9717, 8218, 5746, 3541, 1990, 534], device='cuda:0')","tensor([44, 30, 19, 17, 18, 16, 19, 21, 11, 2, 0], device='cuda:0')",20000,392,3,250.6846160888672,37.94621276855469,0.1333333402872085,0.983268976211548,0.9807446002960204,28,382,0,3,364,10,0,0,0,0,"tensor([2, 2, 2, 2, 2, 3, 2, 2, 2, 0, 0], device='cuda:0')","tensor([2, 2, 2, 2, 2, 3, 2, 2, 2, 0, 0], device='cuda:0')",20000,434590,5,250.6846160888672,7.329445838928223,0.3515827357769012,0.4055291712284088,0.5392999053001404,93203,111629,2398,4316,341387,322961,0,0,0,0,"tensor([2053, 2196, 2205, 2076, 2110, 2233, 2290, 2067, 1681, 1226, 374], device='cuda:0')","tensor([5, 5, 5, 6, 6, 6, 8, 7, 5, 3, 0], device='cuda:0')",20000,7,0,250.6846160888672,250.6846160888672,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,250.6846160888672,250.6846160888672,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,2,250.6846160888672,81.02434539794922,0.5918340086936951,0.741346538066864,0.7996423244476318,4450,6436,46,385,6092,4106,0,0,0,0,"tensor([119, 131, 132, 107, 98, 105, 103, 95, 84, 66, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,250.6846160888672,164.48936462402344,0.6000946760177612,0.6751889586448669,0.7629804611206055,4435,5361,48,221,5863,4937,0,0,0,0,"tensor([118, 130, 130, 106, 96, 101, 101, 93, 84, 66, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,250.6846160888672,37.94621276855469,0.6003643870353699,0.6743168830871582,0.7729420065879822,4449,5318,47,130,5876,5007,0,0,0,0,"tensor([119, 131, 131, 107, 98, 104, 103, 95, 84, 66, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,5,250.6846160888672,7.329445838928223,0.0,0.774193525314331,0.774193525314331,0,36,0,4,53,17,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0], device='cuda:0')",20000,443761,5,250.6846160888672,7.329445838928223,0.3736891448497772,0.4353797435760498,0.5615140199661255,102752,124900,3420,5091,341009,318861,0,0,0,0,"tensor([2105, 2374, 2310, 2185, 2274, 2476, 2470, 2157, 1713, 1227, 374], device='cuda:0')","tensor([4, 4, 4, 6, 6, 7, 8, 7, 5, 3, 0], device='cuda:0')",20000,0,0,250.6846160888672,250.6846160888672,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,250.6846160888672,7.329445838928223,0.0676713958382606,0.1087176501750946,0.172264814376831,229,376,12,14,6298,6151,0,0,0,0,"tensor([ 6, 5, 6, 7, 9, 13, 16, 15, 14, 11, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,250.6846160888672,17.086719512939453,0.5613084435462952,0.7030174136161804,0.7921177744865417,5594,7968,127,489,8617,6243,0,0,0,0,"tensor([141, 160, 147, 130, 127, 140, 136, 129, 96, 70, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,250.6846160888672,250.6846160888672,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,250.6846160888672,81.02434539794922,0.0,0.1170731708407402,0.1170731708407402,0,24,0,1,385,361,0,0,0,0,"tensor([0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,250.6846160888672,37.94621276855469,0.885317862033844,0.9572874903678894,0.9564446210861206,15123,18154,716,1449,3202,171,0,0,0,0,"tensor([214, 271, 243, 237, 257, 302, 285, 217, 139, 76, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,250.6846160888672,250.6846160888672,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,5,250.6846160888672,7.329445838928223,0.0269456319510936,0.036914337426424,0.0564566440880298,85,117,6,4,6133,6101,0,0,0,0,"tensor([1, 1, 2, 2, 4, 5, 4, 2, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 10,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_10/,autoencoders/matryoshka_chess/trainer_10/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,225.0,133.30255126953125,0.997219979763031,0.161376953125,0.9904769062995912,0.9923064708709716,0.999607503414154,0.2971398532390594,0.2987338900566101,3.4657371044158936,0.9994969367980956,2086,20000,1280000,3,279.7274475097656,38.12222671508789,0.3855586051940918,0.472884863615036,0.6154607534408569,307515,401811,7651,17592,972485,878189,549,1757,548,1733,"tensor([5539, 6685, 6459, 6372, 6336, 6731, 7230, 6276, 4856, 3663, 892], device='cuda:0')","tensor([31, 33, 34, 45, 58, 66, 68, 70, 46, 19, 5], device='cuda:0')",20000,578762,3,279.7274475097656,38.12222671508789,0.3576056659221649,0.4543691277503967,0.6108437180519104,126471,171931,2088,6097,452291,406831,16,28,16,28,"tensor([2593, 3056, 2987, 2919, 2773, 2847, 3046, 2800, 2327, 1793, 446], device='cuda:0')","tensor([29, 31, 32, 42, 55, 63, 64, 66, 42, 16, 3], device='cuda:0')",20000,221620,4,279.7274475097656,16.270511627197266,0.0655454695224762,0.1852127462625503,0.3686877787113189,7518,22658,260,392,214102,198962,6,9,6,9,"tensor([177, 183, 180, 193, 230, 240, 237, 235, 190, 143, 39], device='cuda:0')","tensor([29, 31, 32, 41, 54, 63, 64, 66, 42, 16, 3], device='cuda:0')",20000,1280000,3,279.7274475097656,38.12222671508789,0.3985593318939209,0.5115478038787842,0.6617187857627869,320585,446316,8134,18647,959415,833684,605,3757,604,3750,"tensor([5699, 6895, 6661, 6554, 6547, 7010, 7538, 6492, 4931, 3685, 892], device='cuda:0')","tensor([22, 24, 36, 41, 42, 48, 46, 35, 16, 7, 2], device='cuda:0')",20000,1922,0,279.7274475097656,279.7274475097656,0.0195372756570577,0.0195372756570577,0.0195372756570577,19,19,4,4,1903,1903,0,0,0,0,"tensor([1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,279.7274475097656,16.270511627197266,0.6031376123428345,0.7782315015792847,0.730773389339447,288209,428290,9252,14147,370029,229948,0,0,0,0,"tensor([11537, 11488, 10143, 9390, 8951, 8391, 7162, 4922, 2731, 1766, 377], device='cuda:0')","tensor([23, 9, 9, 9, 6, 8, 10, 13, 8, 2, 0], device='cuda:0')",20000,392,6,279.7274475097656,3.3577582836151123,0.0,0.7258064150810242,0.7598115801811218,0,225,0,3,392,167,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 3, 2, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 3, 2, 1, 0, 0], device='cuda:0')",20000,434590,3,279.7274475097656,38.12222671508789,0.3315477967262268,0.3962053656578064,0.5184698700904846,86747,108401,1948,4205,347843,326189,0,0,0,0,"tensor([1690, 1908, 1848, 1838, 1837, 1935, 2039, 1847, 1460, 1093, 266], device='cuda:0')","tensor([5, 5, 5, 5, 5, 4, 4, 3, 4, 1, 0], device='cuda:0')",20000,7,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,279.7274475097656,16.270511627197266,0.5665718913078308,0.6822325587272644,0.777538001537323,4183,5537,41,153,6359,5005,0,0,0,0,"tensor([ 99, 114, 112, 105, 94, 89, 94, 87, 75, 57, 14], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,4,279.7274475097656,16.270511627197266,0.5740485191345215,0.6891418695449829,0.7738088369369507,4163,5509,43,181,6135,4789,0,0,0,0,"tensor([ 98, 113, 112, 103, 94, 89, 92, 84, 74, 57, 14], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,279.7274475097656,16.270511627197266,0.5750223398208618,0.6894785761833191,0.7821143865585327,4183,5521,41,169,6142,4804,0,0,0,0,"tensor([ 99, 114, 112, 105, 94, 89, 93, 87, 75, 57, 14], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,3,279.7274475097656,38.12222671508789,0.3568550944328308,0.4199866950511932,0.5387724041938782,97000,119385,2877,5372,346761,324376,0,0,0,0,"tensor([1714, 2012, 1922, 1921, 1956, 2100, 2217, 1910, 1478, 1102, 266], device='cuda:0')","tensor([5, 5, 5, 5, 5, 5, 4, 3, 4, 1, 0], device='cuda:0')",20000,0,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,7,279.7274475097656,1.830757021903992,0.0387445539236068,0.0694547146558761,0.1018129140138626,129,235,3,5,6398,6292,0,0,0,0,"tensor([ 6, 6, 7, 7, 9, 10, 10, 12, 13, 12, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,279.7274475097656,38.12222671508789,0.5152647495269775,0.7144467234611511,0.7928823828697205,4962,8244,87,623,9249,5967,0,0,0,0,"tensor([109, 133, 123, 117, 112, 122, 128, 108, 87, 62, 14], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,3,279.7274475097656,38.12222671508789,0.0,0.0938271582126617,0.1078431382775306,0,19,0,1,385,366,0,0,0,0,"tensor([0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,279.7274475097656,38.12222671508789,0.7843862771987915,0.9559459686279296,0.9564921855926514,12087,18119,407,1464,6238,206,0,0,0,0,"tensor([160, 213, 196, 205, 221, 251, 238, 178, 106, 68, 14], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,279.7274475097656,279.7274475097656,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,5,279.7274475097656,7.178698539733887,0.0127815939486026,0.0332015790045261,0.0558851063251495,40,105,1,2,6178,6113,0,0,0,0,"tensor([1, 1, 1, 1, 3, 3, 4, 4, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 11,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_11/,autoencoders/matryoshka_chess/trainer_11/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,246.47999572753903,150.7337188720703,0.9477426409721376,0.1513671875,0.9913830757141112,0.99307781457901,0.9964675903320312,0.2971398532390594,0.2989752888679504,3.4657371044158936,0.9994207620620728,1834,20000,1280000,4,307.5908203125,14.154704093933104,0.352228581905365,0.4622261524200439,0.6014077067375183,274835,389720,5714,16554,1005165,890280,282,2143,281,2116,"tensor([5075, 5798, 5948, 5275, 5844, 6346, 6130, 5027, 3865, 2872, 1276], device='cuda:0')","tensor([30, 30, 38, 42, 50, 60, 63, 51, 33, 17, 3], device='cuda:0')",20000,578762,4,307.5908203125,14.154704093933104,0.3265658617019653,0.450388491153717,0.5963609218597412,113183,170048,1226,6307,465579,408714,5,78,5,78,"tensor([2380, 2633, 2739, 2421, 2608, 2705, 2586, 2258, 1857, 1425, 638], device='cuda:0')","tensor([30, 30, 37, 38, 45, 55, 58, 46, 31, 15, 2], device='cuda:0')",20000,221620,4,307.5908203125,14.154704093933104,0.0492680184543132,0.1474218368530273,0.3042555153369903,5600,17659,108,292,216020,203961,0,25,0,25,"tensor([157, 157, 173, 158, 191, 205, 205, 183, 144, 110, 51], device='cuda:0')","tensor([30, 30, 36, 37, 44, 55, 58, 46, 31, 15, 2], device='cuda:0')",20000,1280000,3,307.5908203125,38.10784912109375,0.3598130643367767,0.5018929839134216,0.6384214162826538,282110,435467,5982,19831,997890,844533,281,3864,281,3855,"tensor([5171, 5942, 6089, 5411, 6011, 6590, 6350, 5157, 3902, 2877, 1276], device='cuda:0')","tensor([24, 26, 36, 39, 42, 47, 37, 25, 14, 7, 1], device='cuda:0')",20000,1922,4,307.5908203125,14.154704093933104,0.0195573847740888,0.026694044470787,0.0457084774971008,19,26,2,0,1903,1896,0,0,0,0,"tensor([1, 1, 1, 0, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,307.5908203125,38.10784912109375,0.6225662231445312,0.7678897976875305,0.7461495399475098,301643,419335,9150,14602,356595,238903,0,0,0,0,"tensor([10518, 10323, 9194, 8145, 8039, 7496, 5888, 3514, 2114, 1326, 544], device='cuda:0')","tensor([34, 6, 6, 6, 8, 12, 9, 10, 4, 4, 0], device='cuda:0')",20000,392,7,307.5908203125,0.728745698928833,0.0,0.1418439596891403,0.2331838309764862,0,30,0,1,392,362,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 0, 3, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 3, 0, 0, 0], device='cuda:0')",20000,434590,2,307.5908203125,94.9520263671875,0.2992944121360779,0.3818100392818451,0.4889045357704162,76712,103645,1317,4679,357878,330945,0,0,0,0,"tensor([1514, 1648, 1739, 1555, 1711, 1789, 1695, 1484, 1147, 857, 385], device='cuda:0')","tensor([1, 1, 2, 3, 3, 3, 4, 2, 1, 1, 0], device='cuda:0')",20000,7,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,307.5908203125,206.7591094970703,0.5174952745437622,0.7074071764945984,0.7648141384124756,3690,5840,29,129,6852,4702,0,0,0,0,"tensor([89, 98, 95, 81, 85, 85, 79, 77, 61, 45, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,307.5908203125,206.7591094970703,0.5262181758880615,0.7162802219390869,0.7697629332542419,3688,5823,31,138,6610,4475,0,0,0,0,"tensor([89, 97, 94, 81, 85, 84, 78, 73, 60, 45, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,307.5908203125,206.7591094970703,0.5254912972450256,0.7157067656517029,0.7725602984428406,3690,5828,29,133,6635,4497,0,0,0,0,"tensor([89, 97, 94, 81, 85, 85, 78, 75, 61, 45, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,307.5908203125,94.9520263671875,0.3264983892440796,0.4085144102573395,0.5177521109580994,87003,115351,2182,5622,356758,328410,0,0,0,0,"tensor([1532, 1731, 1791, 1618, 1806, 1916, 1830, 1544, 1166, 858, 385], device='cuda:0')","tensor([1, 1, 2, 3, 3, 4, 4, 2, 1, 1, 0], device='cuda:0')",20000,0,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,6,307.5908203125,1.7606003284454346,0.0410856194794178,0.078529417514801,0.1195574104785919,137,267,5,6,6390,6260,0,0,0,0,"tensor([ 6, 6, 7, 7, 10, 12, 14, 9, 11, 11, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,307.5908203125,38.10784912109375,0.4316340684890747,0.6584584712982178,0.7748645544052124,3916,7193,18,444,10295,7018,0,0,0,0,"tensor([ 95, 108, 110, 93, 100, 103, 101, 81, 65, 48, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,307.5908203125,94.9520263671875,0.0,0.1219512149691581,0.1219512149691581,0,25,0,0,385,360,0,0,0,0,"tensor([0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,307.5908203125,94.9520263671875,0.795721709728241,0.9552419781684875,0.9565670490264891,12424,18109,478,1481,5901,216,0,0,0,0,"tensor([140, 179, 178, 164, 190, 216, 183, 121, 79, 51, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,307.5908203125,307.5908203125,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,3,307.5908203125,38.10784912109375,0.0263450257480144,0.0325794741511344,0.0474022887647151,83,103,0,2,6135,6115,0,0,0,0,"tensor([1, 1, 1, 3, 2, 2, 2, 2, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 12,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_12/,autoencoders/matryoshka_chess/trainer_12/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,269.1199951171875,167.6033172607422,0.8721848726272583,0.1435546875,0.992835283279419,0.9944320321083068,0.9963332414627076,0.2971398532390594,0.2992188632488251,3.4657371044158936,0.9993438720703124,1595,20000,1280000,2,337.0758972167969,112.9479751586914,0.2991271913051605,0.4374591708183288,0.5683576464653015,225694,362697,3323,15501,1054306,917303,154,858,154,857,"tensor([3721, 4577, 4687, 4532, 4364, 5055, 4887, 4066, 3275, 2467, 828], device='cuda:0')","tensor([20, 20, 23, 24, 28, 29, 33, 30, 24, 11, 2], device='cuda:0')",20000,578762,2,337.0758972167969,112.9479751586914,0.2837916016578674,0.421068400144577,0.5500198602676392,95815,155977,672,6124,482947,422785,3,16,3,16,"tensor([1789, 2107, 2203, 2143, 1979, 2134, 2058, 1831, 1580, 1225, 414], device='cuda:0')","tensor([19, 19, 22, 23, 25, 26, 29, 26, 21, 9, 1], device='cuda:0')",20000,221620,4,337.0758972167969,16.264436721801758,0.0392418764531612,0.1066585853695869,0.1927867531776428,4436,12491,29,113,217184,209129,0,2,0,2,"tensor([111, 112, 122, 132, 131, 147, 137, 132, 111, 85, 31], device='cuda:0')","tensor([19, 19, 22, 23, 25, 26, 29, 26, 21, 9, 1], device='cuda:0')",20000,1280000,2,337.0758972167969,112.9479751586914,0.3024581372737884,0.4674644768238067,0.6031171679496765,228665,395553,3379,16781,1051335,884447,159,2287,159,2282,"tensor([3780, 4686, 4797, 4612, 4462, 5217, 5053, 4182, 3317, 2471, 828], device='cuda:0')","tensor([12, 13, 20, 21, 23, 25, 26, 18, 13, 5, 1], device='cuda:0')",20000,1922,0,337.0758972167969,337.0758972167969,0.0154878674075007,0.0154878674075007,0.0154878674075007,15,15,0,0,1907,1907,0,0,0,0,"tensor([1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,337.0758972167969,16.264436721801758,0.5563461184501648,0.754757285118103,0.7174476981163025,256080,407124,6260,13459,402158,251114,0,0,0,0,"tensor([9076, 9020, 7779, 7119, 6657, 6445, 5019, 2872, 1756, 1106, 352], device='cuda:0')","tensor([43, 15, 1, 1, 0, 2, 2, 2, 2, 0, 0], device='cuda:0')",20000,392,5,337.0758972167969,5.462353706359863,0.0,0.324894517660141,0.4015904664993286,0,77,0,5,392,315,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 2, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 2, 1, 0, 0, 0], device='cuda:0')",20000,434590,2,337.0758972167969,112.9479751586914,0.2456619888544082,0.3592444956302643,0.4587824642658233,60948,95993,656,3833,373642,338597,0,0,0,0,"tensor([1119, 1263, 1357, 1311, 1218, 1343, 1314, 1149, 948, 728, 247], device='cuda:0')","tensor([0, 0, 0, 1, 2, 2, 2, 0, 1, 1, 0], device='cuda:0')",20000,7,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,337.0758972167969,5.462353706359863,0.4434449374675751,0.6893310546875,0.7573676705360413,3007,5647,13,195,7535,4895,0,0,0,0,"tensor([61, 73, 74, 70, 63, 65, 65, 61, 51, 39, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,337.0758972167969,5.462353706359863,0.4515693485736847,0.6955820322036743,0.7640689611434937,3007,5605,13,213,7291,4693,0,0,0,0,"tensor([61, 72, 74, 69, 63, 64, 65, 58, 51, 39, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,337.0758972167969,5.462353706359863,0.4506556987762451,0.6974701881408691,0.7608597874641418,3007,5638,13,204,7318,4687,0,0,0,0,"tensor([61, 73, 74, 69, 62, 65, 65, 61, 51, 39, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,337.0758972167969,112.9479751586914,0.2694250047206878,0.3881236910820007,0.4842833578586578,69279,108048,1233,4962,374482,335713,0,0,0,0,"tensor([1128, 1346, 1408, 1346, 1281, 1484, 1440, 1195, 953, 728, 247], device='cuda:0')","tensor([0, 0, 0, 1, 2, 3, 2, 0, 1, 1, 0], device='cuda:0')",20000,0,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,337.0758972167969,46.22982406616211,0.0310474745929241,0.0640569403767585,0.0866891220211982,103,216,5,1,6424,6311,0,0,0,0,"tensor([ 3, 3, 4, 8, 8, 9, 8, 8, 10, 6, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,337.0758972167969,16.264436721801758,0.4074488580226898,0.7016712427139282,0.7835557460784912,3643,7998,28,588,10568,6213,0,0,0,0,"tensor([74, 90, 93, 88, 75, 81, 79, 67, 58, 40, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,337.0758972167969,46.22982406616211,0.612881600856781,0.9544986486434937,0.9564172625541688,8212,18093,261,1493,10113,232,0,0,0,0,"tensor([ 88, 138, 118, 123, 137, 174, 162, 103, 66, 43, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,337.0758972167969,337.0758972167969,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,5,337.0758972167969,5.462353706359863,0.0178514495491981,0.0285351928323507,0.0440390035510063,56,90,0,0,6162,6128,0,0,0,0,"tensor([1, 1, 1, 2, 1, 3, 3, 3, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 13,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_13/,autoencoders/matryoshka_chess/trainer_13/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,290.79998779296875,185.5725555419922,0.793748140335083,0.14306640625,0.99406898021698,0.9956112504005432,0.9980422258377076,0.2971398532390594,0.2986774146556854,3.4657371044158936,0.9995147585868835,1352,20000,1280000,1,365.376708984375,259.6644592285156,0.2590256333351135,0.4453209638595581,0.5544421076774597,190772,372841,2225,21641,1089228,907159,16,259,16,258,"tensor([2884, 3624, 3758, 3770, 3692, 3759, 4111, 3227, 2533, 2033, 704], device='cuda:0')","tensor([ 9, 9, 9, 15, 16, 19, 20, 25, 16, 8, 1], device='cuda:0')",20000,578762,1,365.376708984375,259.6644592285156,0.2456686198711395,0.4183582365512848,0.5321542024612427,81086,155459,277,8965,497676,423303,3,8,3,8,"tensor([1391, 1668, 1746, 1767, 1685, 1606, 1701, 1441, 1224, 1005, 352], device='cuda:0')","tensor([ 9, 9, 8, 14, 15, 18, 18, 23, 15, 7, 0], device='cuda:0')",20000,221620,4,365.376708984375,16.70774269104004,0.0315090678632259,0.0761958435177803,0.1190460994839668,3548,8785,37,185,218072,212835,0,8,0,8,"tensor([ 91, 91, 94, 98, 102, 100, 108, 113, 85, 70, 24], device='cuda:0')","tensor([ 9, 9, 8, 14, 15, 18, 18, 23, 15, 7, 0], device='cuda:0')",20000,1280000,2,365.376708984375,126.8513641357422,0.2604385614395141,0.4666261374950409,0.5840609073638916,191972,396153,2249,21793,1088028,883847,14,1598,14,1598,"tensor([2912, 3698, 3856, 3832, 3754, 3870, 4229, 3316, 2559, 2038, 704], device='cuda:0')","tensor([ 6, 7, 8, 13, 13, 15, 14, 14, 6, 3, 1], device='cuda:0')",20000,1922,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,365.376708984375,50.06416320800781,0.4570319652557373,0.7312532663345337,0.6272329688072205,196420,387218,4888,13597,461818,271020,0,0,0,0,"tensor([8404, 8266, 7176, 6399, 5921, 5612, 4534, 2460, 1298, 912, 295], device='cuda:0')","tensor([56, 0, 0, 0, 0, 0, 2, 2, 4, 2, 0], device='cuda:0')",20000,392,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,2,365.376708984375,126.8513641357422,0.2052164375782013,0.3507782220840454,0.4433852732181549,49734,93461,374,4827,384856,341129,0,0,0,0,"tensor([ 874, 1010, 1072, 1065, 1015, 1009, 1090, 925, 744, 601, 210], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,7,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,365.376708984375,259.6644592285156,0.4006973505020141,0.7462857365608215,0.7993211150169373,2643,6505,7,386,7899,4037,0,0,0,0,"tensor([48, 58, 58, 61, 56, 53, 55, 47, 41, 32, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,365.376708984375,259.6644592285156,0.4060324728488922,0.7528946399688721,0.8028160929679871,2625,6470,7,419,7673,3828,0,0,0,0,"tensor([47, 57, 58, 61, 55, 53, 54, 47, 41, 32, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,365.376708984375,259.6644592285156,0.4073988199234009,0.7531365752220154,0.8055153489112854,2643,6483,7,408,7682,3842,0,0,0,0,"tensor([48, 58, 58, 61, 56, 53, 55, 47, 41, 32, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,1,365.376708984375,259.6644592285156,0.2166215926408767,0.3817495107650757,0.4697044193744659,53973,106109,582,6039,389788,337652,0,0,0,0,"tensor([ 882, 1076, 1112, 1125, 1083, 1108, 1212, 976, 760, 601, 210], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,0,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,7,365.376708984375,0.6289972066879272,0.0221178606152534,0.0360848009586334,0.0428015552461147,73,120,1,4,6454,6407,0,0,0,0,"tensor([2, 2, 2, 2, 3, 3, 4, 4, 5, 3, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,365.376708984375,259.6644592285156,0.3364518582820892,0.7041983008384705,0.7816705107688904,2877,8068,14,635,11334,6143,0,0,0,0,"tensor([53, 70, 73, 69, 63, 58, 59, 52, 42, 33, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,365.376708984375,126.8513641357422,0.3588230013847351,0.9498290419578552,0.9565535187721252,4012,17919,25,1487,14313,406,0,0,0,0,"tensor([ 61, 99, 99, 93, 106, 140, 141, 85, 51, 33, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,365.376708984375,365.376708984375,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,365.376708984375,16.70774269104004,0.0009644751553423,0.0118305357173085,0.0156374666839838,3,37,0,0,6215,6181,0,0,0,0,"tensor([1, 1, 0, 1, 2, 1, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 14,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_14/,autoencoders/matryoshka_chess/trainer_14/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,309.47998046875,204.3821563720703,0.7023541331291199,0.13916015625,0.9953594207763672,0.9967126250267028,0.9986053109169006,0.2971398532390594,0.2979722023010254,3.4657371044158936,0.9997373223304749,1164,20000,1280000,3,393.4605102539063,56.844947814941406,0.2130104154348373,0.4293578267097473,0.5344139933586121,152706,354428,1083,16540,1127294,925572,12,177,12,177,"tensor([1933, 2410, 2892, 3126, 3007, 2929, 3028, 2364, 1759, 1395, 384], device='cuda:0')","tensor([ 6, 6, 4, 6, 6, 7, 6, 11, 8, 4, 1], device='cuda:0')",20000,578762,3,393.4605102539063,56.844947814941406,0.2108270972967147,0.408626914024353,0.50666344165802,68215,150199,141,6179,510547,428563,1,0,1,0,"tensor([ 925, 1070, 1329, 1439, 1376, 1252, 1223, 1053, 860, 697, 192], device='cuda:0')","tensor([6, 6, 4, 5, 5, 6, 4, 9, 6, 2, 0], device='cuda:0')",20000,221620,4,393.4605102539063,18.005733489990234,0.0219897888600826,0.0335481502115726,0.0608966201543808,2464,3782,20,65,219156,217838,0,0,0,0,"tensor([59, 60, 61, 66, 67, 64, 64, 64, 59, 47, 8], device='cuda:0')","tensor([6, 6, 4, 5, 5, 6, 4, 9, 6, 2, 0], device='cuda:0')",20000,1280000,2,393.4605102539063,146.6195831298828,0.2135041952133178,0.4507453143596649,0.5594671964645386,153103,378853,1089,22154,1126897,901147,11,809,11,806,"tensor([1955, 2473, 2970, 3206, 3070, 2998, 3129, 2408, 1777, 1396, 384], device='cuda:0')","tensor([5, 5, 5, 6, 6, 5, 4, 7, 3, 2, 1], device='cuda:0')",20000,1922,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,393.4605102539063,56.844947814941406,0.2931473851203918,0.7249541282653809,0.5155528783798218,113486,381763,2535,13205,544752,276475,0,0,0,0,"tensor([7755, 7642, 6494, 5829, 5256, 4809, 3789, 1835, 915, 583, 152], device='cuda:0')","tensor([70, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,7,393.4605102539063,0.5513486862182617,0.0,0.3277311027050018,0.3463917374610901,0,78,0,6,392,314,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 2, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 2, 1, 0, 0], device='cuda:0')",20000,434590,3,393.4605102539063,56.844947814941406,0.165179431438446,0.3285518288612366,0.4169001579284668,39141,86166,190,3764,395449,348424,0,0,0,0,"tensor([577, 647, 798, 867, 819, 748, 752, 624, 508, 413, 109], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,393.4605102539063,290.9395751953125,0.3543276488780975,0.729699432849884,0.7631155848503113,2270,6178,1,213,8272,4364,0,0,0,0,"tensor([34, 39, 46, 51, 46, 40, 36, 31, 27, 22, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,393.4605102539063,290.9395751953125,0.3610470294952392,0.7376115918159485,0.770105242729187,2269,6155,2,236,8029,4143,0,0,0,0,"tensor([34, 39, 46, 51, 46, 40, 36, 31, 27, 22, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,393.4605102539063,290.9395751953125,0.3604319095611572,0.7379755973815918,0.770959734916687,2270,6168,1,223,8055,4157,0,0,0,0,"tensor([34, 39, 46, 51, 46, 40, 36, 31, 27, 22, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,393.4605102539063,146.6195831298828,0.1809466481208801,0.3714318871498108,0.4514307379722595,44185,102562,430,5929,399576,341199,0,0,0,0,"tensor([585, 717, 850, 908, 863, 814, 852, 660, 514, 413, 109], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,393.4605102539063,4.92664909362793,0.0295849069952964,0.0355047360062599,0.0422788597643375,98,118,0,2,6429,6409,0,0,0,0,"tensor([3, 3, 3, 4, 4, 5, 4, 4, 3, 3, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,393.4605102539063,290.9395751953125,0.2800459861755371,0.7019050121307373,0.7612709403038025,2315,8014,7,610,11896,6197,0,0,0,0,"tensor([34, 44, 55, 59, 53, 46, 47, 34, 28, 22, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,393.4605102539063,146.6195831298828,0.4375238120555877,0.9448016881942748,0.9564558863639832,5163,17630,113,1365,13162,695,0,0,0,0,"tensor([ 43, 80, 80, 90, 80, 105, 106, 67, 38, 22, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,393.4605102539063,393.4605102539063,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,393.4605102539063,1.4221495389938354,0.0,0.002248634584248,0.002248634584248,0,7,0,1,6218,6211,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 15,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_15/,autoencoders/matryoshka_chess/trainer_15/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,331.0799865722656,231.2666778564453,0.605963945388794,0.1396484375,0.9964300990104676,0.997648298740387,0.998993992805481,0.2971398532390594,0.2977020740509033,3.4657371044158936,0.9998225569725036,1027,20000,1280000,2,420.1065673828125,175.76390075683594,0.1695823818445205,0.4128341674804687,0.5106173753738403,118635,337546,508,17716,1161365,942454,0,132,0,132,"tensor([1326, 1643, 2380, 2176, 2139, 1966, 1890, 1606, 1259, 1011, 640], device='cuda:0')","tensor([4, 4, 5, 3, 3, 2, 2, 3, 1, 1, 1], device='cuda:0')",20000,578762,3,420.1065673828125,71.7101058959961,0.1730343103408813,0.39340940117836,0.4834910631179809,54819,143370,39,6727,523943,435392,0,0,0,0,"tensor([ 645, 734, 1089, 993, 974, 828, 716, 689, 605, 503, 320], device='cuda:0')","tensor([3, 3, 4, 2, 2, 1, 1, 2, 0, 0, 0], device='cuda:0')",20000,221620,4,420.1065673828125,22.68703842163086,0.0139884576201438,0.0157662201672792,0.0220759809017181,1561,1761,3,8,220059,219859,0,0,0,0,"tensor([39, 39, 41, 39, 38, 41, 33, 36, 31, 29, 18], device='cuda:0')","tensor([3, 3, 4, 2, 2, 1, 1, 2, 0, 0, 0], device='cuda:0')",20000,1280000,2,420.1065673828125,175.76390075683594,0.1707085818052292,0.4342121481895447,0.5308112502098083,119503,360367,579,19499,1160497,919633,0,148,0,148,"tensor([1333, 1682, 2428, 2228, 2176, 2005, 1945, 1645, 1268, 1013, 640], device='cuda:0')","tensor([4, 4, 5, 3, 2, 1, 1, 3, 1, 1, 1], device='cuda:0')",20000,1922,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,420.1065673828125,71.7101058959961,0.1812182515859604,0.7057012915611267,0.4335786700248718,65714,365687,1295,12454,592524,292551,0,0,0,0,"tensor([7363, 7266, 6241, 5271, 4512, 4064, 3198, 1537, 695, 438, 261], device='cuda:0')","tensor([84, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,3,420.1065673828125,71.7101058959961,0.1289442032575607,0.3299247026443481,0.402958869934082,29952,86774,31,4659,404638,347816,0,0,0,0,"tensor([395, 437, 612, 564, 550, 482, 430, 410, 358, 294, 181], device='cuda:0')","tensor([0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,420.1065673828125,71.7101058959961,0.2877791225910187,0.7037543654441833,0.7565260529518127,1772,5914,1,351,8770,4628,0,0,0,0,"tensor([22, 25, 39, 35, 33, 25, 22, 22, 19, 16, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,420.1065673828125,71.7101058959961,0.2935962378978729,0.7114652991294861,0.7631741762161255,1772,5892,1,373,8526,4406,0,0,0,0,"tensor([22, 25, 39, 35, 33, 25, 22, 21, 19, 16, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,420.1065673828125,71.7101058959961,0.292941004037857,0.7127184867858887,0.7636343240737915,1772,5912,1,353,8553,4413,0,0,0,0,"tensor([22, 25, 38, 35, 33, 25, 21, 21, 19, 16, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,420.1065673828125,175.76390075683594,0.1396129429340362,0.35211843252182,0.4317998886108398,33318,95919,212,5131,410443,347842,0,0,0,0,"tensor([401, 498, 685, 633, 591, 537, 522, 458, 359, 294, 181], device='cuda:0')","tensor([0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,8,420.1065673828125,0.3095001876354217,0.0064141722396016,0.0100609762594103,0.0100594423711299,21,33,0,0,6506,6494,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 1, 2, 2, 1, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,2,420.1065673828125,175.76390075683594,0.2218468338251114,0.6813518404960632,0.7637842893600464,1773,7671,0,635,12438,6540,0,0,0,0,"tensor([22, 27, 46, 43, 39, 27, 25, 23, 19, 17, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,420.1065673828125,175.76390075683594,0.3022644519805908,0.9392760396003724,0.955839216709137,3277,17386,81,1309,15048,939,0,0,0,0,"tensor([26, 55, 69, 60, 60, 65, 75, 50, 29, 17, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,420.1065673828125,420.1065673828125,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,420.1065673828125,22.68703842163086,0.0,0.005772931035608,0.005772931035608,0,18,0,0,6218,6200,0,0,0,0,"tensor([0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 16,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_16/,autoencoders/matryoshka_chess/trainer_16/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,354.1199951171875,263.7771301269531,0.5032786726951599,0.140380859375,0.997511625289917,0.99853253364563,0.9994965195655824,0.2971398532390594,0.2971544563770294,3.4657371044158936,0.9999954104423524,959,20000,1280000,3,444.8411865234375,99.7497100830078,0.1473166346549987,0.4165587723255157,0.5097283124923706,101784,341195,56,16965,1178216,938805,0,62,0,62,"tensor([ 729, 949, 1474, 1635, 1642, 1709, 1359, 1351, 872, 686, 384], device='cuda:0')","tensor([2, 2, 2, 2, 2, 2, 2, 1, 1, 0, 0], device='cuda:0')",20000,578762,3,444.8411865234375,99.7497100830078,0.160487562417984,0.3877716064453125,0.479607880115509,50495,140726,13,6331,528267,438036,0,0,0,0,"tensor([363, 423, 630, 722, 740, 745, 499, 521, 421, 343, 192], device='cuda:0')","tensor([2, 2, 2, 2, 2, 2, 2, 1, 1, 0, 0], device='cuda:0')",20000,221620,5,444.8411865234375,8.821205139160156,0.01121730171144,0.0125369364395737,0.0184077601879835,1250,1398,0,3,220370,220222,0,0,0,0,"tensor([21, 21, 24, 23, 20, 26, 18, 19, 19, 16, 10], device='cuda:0')","tensor([2, 2, 2, 2, 2, 2, 2, 1, 1, 0, 0], device='cuda:0')",20000,1280000,2,444.8411865234375,219.1645965576172,0.1482591480016708,0.43842813372612,0.5310550332069397,102492,364918,114,19747,1177508,915082,0,75,0,75,"tensor([ 730, 965, 1530, 1687, 1684, 1741, 1396, 1389, 883, 687, 384], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1922,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,444.8411865234375,33.7834587097168,0.116059772670269,0.693767786026001,0.4113825559616089,40559,355198,136,10532,617679,303040,0,0,0,0,"tensor([7073, 6954, 6015, 5065, 4262, 3812, 2961, 1761, 476, 277, 156], device='cuda:0')","tensor([70, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,3,444.8411865234375,99.7497100830078,0.1164725720882415,0.3278601765632629,0.3987822830677032,26875,86111,17,4590,407715,348479,0,0,0,0,"tensor([216, 250, 361, 403, 408, 415, 290, 304, 238, 188, 106], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,7,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,444.8411865234375,99.7497100830078,0.2632619440555572,0.6373626589775085,0.743094265460968,1598,5046,0,246,8944,5496,0,0,0,0,"tensor([12, 14, 20, 26, 25, 25, 16, 16, 13, 11, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,444.8411865234375,8.821205139160156,0.2686617076396942,0.6316612958908081,0.7396373152732849,1598,4842,0,191,8700,5456,0,0,0,0,"tensor([12, 14, 20, 24, 25, 25, 16, 16, 13, 11, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,444.8411865234375,8.821205139160156,0.2680533230304718,0.6301602125167847,0.7387822270393372,1598,4839,0,194,8727,5486,0,0,0,0,"tensor([12, 14, 19, 24, 25, 25, 16, 16, 13, 11, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,444.8411865234375,219.1645965576172,0.1142030358314514,0.3595170974731445,0.4306481778621673,26875,98512,17,5751,416886,345249,0,0,0,0,"tensor([216, 281, 428, 452, 447, 450, 349, 355, 239, 188, 106], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,0,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,0,444.8411865234375,444.8411865234375,0.0064141722396016,0.0064141722396016,0.0064141722396016,21,21,0,0,6506,6506,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,444.8411865234375,99.7497100830078,0.2021633237600326,0.7308760285377502,0.790064811706543,1598,8556,0,646,12613,5655,0,0,0,0,"tensor([12, 15, 29, 33, 32, 28, 17, 18, 14, 11, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,444.8411865234375,219.1645965576172,0.2853283584117889,0.941283881664276,0.9546682834625244,3063,17522,82,1383,15262,803,0,0,0,0,"tensor([14, 31, 56, 58, 53, 50, 52, 51, 19, 11, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,444.8411865234375,444.8411865234375,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 17,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_17/,autoencoders/matryoshka_chess/trainer_17/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,374.4400024414063,298.1107482910156,0.4023542702198028,0.14306640625,0.9982938766479492,0.9991299510002136,0.999351680278778,0.2971398532390594,0.2970591783523559,3.4657371044158936,1.0000253915786743,926,20000,1280000,3,463.7056274414063,130.10643005371094,0.139067068696022,0.4231197237968445,0.5062435865402222,95673,348331,253,18158,1184327,931669,0,25,0,25,"tensor([ 445, 627, 1125, 1344, 1626, 1552, 1299, 1095, 809, 689, 320], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,578762,3,463.7056274414063,130.10643005371094,0.144511878490448,0.3875398337841034,0.4741684794425964,45076,140638,0,6399,533686,438124,0,0,0,0,"tensor([222, 263, 476, 573, 736, 680, 463, 403, 379, 344, 160], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,221620,5,463.7056274414063,12.08640480041504,0.008339773863554,0.0115468995645642,0.015648990869522,928,1287,0,10,220692,220333,0,0,0,0,"tensor([13, 13, 15, 13, 18, 20, 14, 14, 15, 18, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1280000,3,463.7056274414063,130.10643005371094,0.139067068696022,0.4431793093681335,0.5279509425163269,95673,370080,253,20034,1184327,909920,0,27,0,27,"tensor([ 445, 646, 1167, 1401, 1679, 1593, 1346, 1130, 826, 690, 320], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,1922,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,463.7056274414063,46.81441116333008,0.1430990099906921,0.689012885093689,0.3896455764770508,50800,351441,960,10450,607438,306797,0,0,0,0,"tensor([7080, 6901, 6101, 5168, 4331, 3792, 3149, 1690, 498, 292, 129], device='cuda:0')","tensor([113, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,3,463.7056274414063,130.10643005371094,0.1027366071939468,0.3086998462677002,0.3905979096889496,23533,80040,0,3932,411057,354550,0,0,0,0,"tensor([128, 153, 251, 317, 393, 381, 274, 234, 216, 192, 91], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,463.7056274414063,130.10643005371094,0.2357961684465408,0.6415979862213135,0.7392550110816956,1409,5059,0,169,9133,5483,0,0,0,0,"tensor([ 7, 9, 15, 21, 24, 21, 14, 12, 12, 11, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,463.7056274414063,130.10643005371094,0.2407106906175613,0.6509081721305847,0.747413694858551,1409,5053,0,175,8889,5245,0,0,0,0,"tensor([ 7, 9, 15, 21, 24, 21, 14, 12, 12, 11, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,463.7056274414063,130.10643005371094,0.2401568293571472,0.6505497694015503,0.7469795346260071,1409,5059,0,169,8916,5266,0,0,0,0,"tensor([ 7, 8, 15, 21, 24, 21, 14, 12, 12, 11, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,3,463.7056274414063,130.10643005371094,0.1007203087210655,0.3498390316963196,0.4231343567371368,23533,95201,0,5294,420228,348560,0,0,0,0,"tensor([128, 191, 317, 376, 450, 416, 331, 286, 225, 192, 91], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,0,463.7056274414063,463.7056274414063,0.0064141722396016,0.0064141722396016,0.0064141722396016,21,21,0,0,6506,6506,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,463.7056274414063,130.10643005371094,0.1804097443819046,0.7216004729270935,0.7751142382621765,1409,8350,0,582,12802,5861,0,0,0,0,"tensor([ 7, 9, 20, 26, 32, 26, 17, 13, 13, 11, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,463.7056274414063,260.09442138671875,0.1427992284297943,0.9197517037391664,0.9509011507034302,1409,16596,0,1167,16916,1729,0,0,0,0,"tensor([ 7, 25, 45, 51, 48, 42, 54, 44, 20, 12, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,463.7056274414063,463.7056274414063,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 18,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_18/,autoencoders/matryoshka_chess/trainer_18/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,396.1199951171875,327.78759765625,0.2994136214256286,0.14892578125,0.9989476203918456,0.9995769262313844,0.9999226331710817,0.2971398532390594,0.297252207994461,3.4657371044158936,0.9999645352363586,945,20000,1280000,3,479.9798889160156,153.7305908203125,0.1123375669121742,0.4178402721881866,0.5051209330558777,76177,343031,39,18893,1203823,936969,0,1,0,1,"tensor([ 484, 672, 1174, 1299, 1469, 1578, 1211, 995, 709, 562, 128], device='cuda:0')","tensor([0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,578762,3,479.9798889160156,153.7305908203125,0.1232209876179695,0.3843036293983459,0.4703598022460937,38000,139341,16,7058,540762,439421,0,0,0,0,"tensor([240, 288, 503, 547, 654, 720, 441, 364, 306, 281, 64], device='cuda:0')","tensor([0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,221620,4,479.9798889160156,56.425899505615234,0.0029736426658928,0.0186615176498889,0.0224839355796575,330,2088,0,68,221290,219532,0,0,0,0,"tensor([ 8, 8, 16, 9, 8, 17, 8, 6, 6, 10, 0], device='cuda:0')","tensor([0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1280000,3,479.9798889160156,153.7305908203125,0.1125251874327659,0.4370624423027038,0.5314302444458008,76312,363634,42,20357,1203688,916366,0,4,0,4,"tensor([ 487, 689, 1220, 1352, 1553, 1613, 1250, 1024, 736, 562, 128], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1922,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,479.9798889160156,56.425899505615234,0.1828483492136001,0.6834139823913574,0.4074762463569641,66447,347162,2114,10564,591791,311076,0,0,0,0,"tensor([7226, 7042, 6358, 5350, 4447, 3838, 3331, 1705, 500, 217, 44], device='cuda:0')","tensor([141, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,7,479.9798889160156,0.707748532295227,0.0,0.0769230723381042,0.0769230723381042,0,16,0,8,392,376,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,434590,4,479.9798889160156,56.425899505615234,0.0862203761935234,0.2996345162391662,0.3919396102428436,19580,77146,15,3198,415010,357444,0,0,0,0,"tensor([134, 170, 270, 324, 360, 393, 224, 194, 178, 155, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,479.9798889160156,153.7305908203125,0.205904871225357,0.6579174995422363,0.7517256140708923,1210,5314,1,298,9332,5228,0,0,0,0,"tensor([ 8, 9, 18, 22, 24, 23, 13, 11, 9, 9, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,479.9798889160156,153.7305908203125,0.2102702260017395,0.6668761968612671,0.7517147064208984,1210,5305,1,307,9088,4993,0,0,0,0,"tensor([ 8, 9, 17, 22, 23, 23, 13, 11, 9, 9, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,479.9798889160156,153.7305908203125,0.2097780704498291,0.6664993166923523,0.7506265640258789,1210,5311,1,301,9115,5014,0,0,0,0,"tensor([ 8, 9, 17, 22, 23, 23, 13, 11, 9, 9, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,3,479.9798889160156,153.7305908203125,0.0845138430595398,0.3461321294307709,0.4267877340316772,19580,94037,15,5561,424181,349724,0,0,0,0,"tensor([134, 198, 339, 367, 402, 426, 276, 248, 200, 155, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,2,479.9798889160156,294.2054748535156,0.0064141722396016,0.0085430974140763,0.0085430974140763,21,28,0,0,6506,6499,0,0,0,0,"tensor([1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,479.9798889160156,153.7305908203125,0.1570483744144439,0.719303548336029,0.7626778483390808,1211,8304,0,574,13000,5907,0,0,0,0,"tensor([ 8, 10, 23, 25, 32, 28, 14, 11, 11, 9, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,479.9798889160156,294.2054748535156,0.1238738670945167,0.9188246130943298,0.951447069644928,1210,16588,1,1194,17115,1737,0,0,0,0,"tensor([ 8, 22, 44, 54, 49, 41, 50, 40, 21, 9, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,479.9798889160156,479.9798889160156,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 19,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_19/,autoencoders/matryoshka_chess/trainer_19/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,417.1600036621094,345.0899963378906,0.2415286749601364,0.155029296875,0.9992709159851074,0.9997320175170898,1.0000089406967163,0.2971398532390594,0.2971441149711609,3.4657371044158936,0.9999986290931702,959,20000,1280000,3,491.1651306152344,171.44285583496094,0.105163425207138,0.4137053191661834,0.5089551210403442,71040,338611,0,18356,1208960,941389,0,0,0,0,"tensor([ 320, 508, 1073, 1107, 1525, 1326, 1185, 1088, 638, 442, 128], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')",20000,578762,3,491.1651306152344,171.44285583496094,0.1156472042202949,0.3854517340660095,0.4824675321578979,35520,139887,0,7185,543242,438875,0,0,0,0,"tensor([160, 210, 458, 458, 681, 600, 424, 392, 285, 221, 64], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')",20000,221620,4,491.1651306152344,62.45164108276367,0.0019834116101264,0.0095201740041375,0.0211002677679061,220,1060,0,5,221400,220560,0,0,0,0,"tensor([2, 2, 6, 3, 4, 7, 2, 5, 4, 3, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')",20000,1280000,3,491.1651306152344,171.44285583496094,0.105163425207138,0.4365899264812469,0.5309632420539856,71040,363152,0,20432,1208960,916848,0,0,0,0,"tensor([ 320, 519, 1102, 1161, 1582, 1354, 1233, 1133, 656, 442, 128], device='cuda:0')","tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')",20000,1922,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,491.1651306152344,62.45164108276367,0.5067163705825806,0.6814160943031311,0.5490741729736328,225505,345648,6321,10613,432733,312590,0,0,0,0,"tensor([7262, 7148, 6525, 5440, 4635, 3891, 3500, 1797, 473, 161, 44], device='cuda:0')","tensor([141, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,3,491.1651306152344,171.44285583496094,0.079924002289772,0.3028175830841064,0.3947020173072815,18090,78338,0,4466,416500,356252,0,0,0,0,"tensor([ 83, 114, 244, 247, 371, 329, 215, 193, 160, 113, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,491.1651306152344,62.45164108276367,0.1905252188444137,0.6831424832344055,0.7651702761650085,1110,5639,0,328,9432,4903,0,0,0,0,"tensor([ 5, 6, 18, 17, 25, 19, 12, 11, 8, 7, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,491.1651306152344,171.44285583496094,0.1946002691984176,0.6632255911827087,0.7468493580818176,1110,5204,0,191,9188,5094,0,0,0,0,"tensor([ 5, 6, 18, 16, 24, 19, 12, 11, 8, 7, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,491.1651306152344,62.45164108276367,0.1941407918930053,0.6916278004646301,0.7718788385391235,1110,5634,0,333,9215,4691,0,0,0,0,"tensor([ 5, 6, 18, 17, 25, 19, 12, 11, 8, 7, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,3,491.1651306152344,171.44285583496094,0.0783369541168212,0.3363688588142395,0.4272024929523468,18090,90809,0,5367,425671,352952,0,0,0,0,"tensor([ 83, 144, 306, 303, 403, 346, 275, 255, 173, 113, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,6527,6527,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,491.1651306152344,62.45164108276367,0.1448991447687149,0.6785227656364441,0.7408599853515625,1110,7478,0,353,13101,6733,0,0,0,0,"tensor([ 5, 8, 22, 22, 33, 23, 14, 12, 9, 7, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,491.1651306152344,171.44285583496094,0.1142269149422645,0.9274491667747498,0.9541409611701964,1110,16823,0,1130,17215,1502,0,0,0,0,"tensor([ 5, 19, 43, 51, 50, 41, 53, 50, 17, 7, 2], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,491.1651306152344,491.1651306152344,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,5,491.1651306152344,15.71800422668457,0.0,0.0019280203850939,0.0019280203850939,0,6,0,0,6218,6212,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 20,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_20/,autoencoders/matryoshka_chess/trainer_20/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,10.039999961853027,24.282865524291992,2.18735671043396,0.022705078125,0.9504439830780028,0.9532387852668762,0.9542193412780762,0.2971398532390594,0.3797755837440491,3.4657371044158936,0.9739204049110411,5677,20000,1280000,0,13.689407348632812,13.689407348632812,0.677017092704773,0.677017092704773,0.7649813890457153,671558,671558,32315,32315,608442,608442,15703,15703,15413,15413,"tensor([15391, 15412, 15493, 15724, 15809, 15789, 15085, 13893, 11227, 6501, 1458], device='cuda:0')","tensor([308, 308, 312, 354, 401, 438, 425, 383, 263, 82, 2], device='cuda:0')",20000,578762,0,13.689407348632812,13.689407348632812,0.7328805327415466,0.7328805327415466,0.800858199596405,341862,341862,12303,12303,236900,236900,1519,1519,1489,1489,"tensor([6160, 6176, 6234, 6390, 6491, 6534, 6259, 5845, 4900, 3040, 727], device='cuda:0')","tensor([302, 302, 306, 347, 390, 425, 411, 368, 255, 77, 2], device='cuda:0')",20000,221620,3,13.689407348632812,12.509857177734377,0.7357309460639954,0.7442184090614319,0.8110419511795044,130689,132760,2954,2397,90931,88860,900,794,888,788,"tensor([738, 738, 749, 804, 875, 954, 965, 867, 611, 286, 63], device='cuda:0')","tensor([300, 300, 304, 345, 388, 425, 411, 368, 255, 77, 2], device='cuda:0')",20000,1280000,0,13.689407348632812,13.689407348632812,0.6999298334121704,0.6999298334121704,0.778143584728241,706813,706813,32855,32855,573187,573187,17556,17556,17532,17532,"tensor([16374, 16384, 16446, 16653, 16653, 16543, 15767, 14466, 11603, 6634, 1458], device='cuda:0')","tensor([236, 234, 237, 242, 254, 264, 224, 191, 121, 34, 0], device='cuda:0')",20000,1922,2,13.689407348632812,13.43654727935791,0.0505305714905262,0.0680680647492408,0.1279069781303405,50,68,7,8,1872,1854,0,0,0,0,"tensor([4, 4, 5, 5, 5, 4, 4, 4, 4, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,0,13.689407348632812,13.689407348632812,0.8947720527648926,0.8947720527648926,0.91414475440979,546963,546963,17374,17374,111275,111275,0,0,0,0,"tensor([19317, 19316, 19215, 18984, 18466, 17574, 15818, 13225, 9132, 3887, 643], device='cuda:0')","tensor([ 81, 81, 81, 87, 105, 119, 103, 93, 51, 22, 0], device='cuda:0')",20000,392,3,13.689407348632812,12.509857177734377,0.9949238896369934,1.0,0.9949238896369934,392,392,4,0,0,0,0,0,0,0,"tensor([16, 16, 16, 14, 13, 10, 10, 7, 5, 1, 0], device='cuda:0')","tensor([16, 16, 16, 14, 13, 10, 10, 7, 5, 1, 0], device='cuda:0')",20000,434590,4,13.689407348632812,10.720606803894045,0.5248658061027527,0.5516120791435242,0.686937689781189,157750,168237,8766,7156,276840,266353,0,0,0,0,"tensor([4169, 4173, 4223, 4351, 4416, 4542, 4480, 4219, 3462, 2033, 434], device='cuda:0')","tensor([28, 28, 31, 37, 34, 41, 43, 39, 28, 12, 0], device='cuda:0')",20000,7,0,13.689407348632812,13.689407348632812,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,13.689407348632812,13.689407348632812,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,13.689407348632812,13.661259651184082,0.9377766847610474,0.9389286637306212,0.9337424635887146,9638,9632,375,343,904,910,0,0,0,0,"tensor([228, 228, 229, 229, 231, 222, 197, 185, 154, 96, 23], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,13.689407348632812,13.661259651184082,0.8581084609031677,0.8592010736465454,0.8635079860687256,7998,7991,345,312,2300,2307,0,0,0,0,"tensor([219, 219, 220, 222, 223, 216, 191, 180, 149, 93, 23], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,13.689407348632812,13.661259651184082,0.9316996335983276,0.9328008890151978,0.9276950359344482,9467,9460,530,498,858,865,0,0,0,0,"tensor([226, 226, 227, 227, 229, 219, 195, 182, 153, 96, 23], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,7,13.689407348632812,3.2004027366638184,0.0,0.7356322407722473,0.7356322407722473,0,32,0,2,53,21,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')",20000,443761,4,13.689407348632812,10.720606803894045,0.5761760473251343,0.5824461579322815,0.7004029750823975,183729,185745,10263,8304,260032,258016,0,0,0,0,"tensor([4532, 4534, 4575, 4689, 4729, 4810, 4679, 4368, 3572, 2060, 434], device='cuda:0')","tensor([31, 31, 34, 37, 40, 44, 43, 40, 28, 12, 0], device='cuda:0')",20000,0,0,13.689407348632812,13.689407348632812,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,7,13.689407348632812,3.2004027366638184,0.0931586623191833,0.1430189758539199,0.2375734895467758,320,505,23,30,6207,6022,0,0,0,0,"tensor([ 9, 9, 9, 10, 11, 12, 13, 21, 22, 15, 8], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,0,13.689407348632812,13.689407348632812,0.7322946786880493,0.7322946786880493,0.7787019610404968,8484,8484,476,476,5727,5727,0,0,0,0,"tensor([310, 310, 309, 311, 306, 282, 268, 239, 201, 111, 23], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,13.689407348632812,13.689407348632812,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,6,13.689407348632812,5.623547554016113,0.0651629045605659,0.5454545617103577,0.5974955558776855,13,147,1,7,372,238,0,0,0,0,"tensor([1, 1, 1, 1, 3, 3, 4, 3, 3, 1, 0], device='cuda:0')","tensor([1, 1, 1, 1, 3, 3, 4, 3, 3, 1, 0], device='cuda:0')",20000,18325,2,13.689407348632812,13.43654727935791,0.9665524959564208,0.9669488072395324,0.9632105231285096,18061,18051,986,960,264,274,0,0,0,0,"tensor([631, 631, 630, 630, 608, 585, 527, 469, 328, 145, 23], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,5,13.689407348632812,8.274242401123047,0.0139257302507758,0.0551589876413345,0.0551589876413345,21,85,7,9,2967,2903,0,0,0,0,"tensor([2, 2, 2, 2, 2, 3, 3, 2, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,13.689407348632812,13.689407348632812,0.0470957607030868,0.0470957607030868,0.078939251601696,150,150,2,2,6068,6068,0,0,0,0,"tensor([4, 4, 4, 4, 4, 5, 6, 6, 6, 4, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 21,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_21/,autoencoders/matryoshka_chess/trainer_21/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,31.559999465942383,37.72310256958008,1.5667568445205688,0.060302734375,0.9745681881904602,0.9769627451896667,0.9839387536048888,0.2971398532390594,0.3148456513881683,3.4657371044158936,0.994412124156952,7359,20000,1280000,3,39.44126129150391,24.461658477783203,0.6480461955070496,0.7156028747558594,0.8155298233032227,632985,732128,40533,34057,647015,547872,11726,17678,11572,17446,"tensor([24183, 23414, 22916, 23234, 22391, 21390, 19528, 16978, 12321, 7405, 1792], device='cuda:0')","tensor([217, 228, 292, 410, 483, 502, 461, 384, 229, 82, 11], device='cuda:0')",20000,578762,3,39.44126129150391,24.461658477783203,0.6563358902931213,0.7712779641151428,0.8604903817176819,291336,371154,17667,12523,287426,207608,819,1690,793,1667,"tensor([9972, 9733, 9614, 9844, 9521, 9059, 8252, 7210, 5453, 3521, 891], device='cuda:0')","tensor([210, 221, 284, 394, 469, 488, 449, 373, 223, 76, 9], device='cuda:0')",20000,221620,3,39.44126129150391,24.461658477783203,0.4142716526985168,0.7671194076538086,0.877489447593689,58566,139544,2556,2649,163054,82076,167,814,162,804,"tensor([ 573, 586, 713, 924, 1087, 1152, 1072, 920, 586, 291, 78], device='cuda:0')","tensor([210, 220, 283, 392, 467, 486, 449, 373, 223, 76, 9], device='cuda:0')",20000,1280000,2,39.44126129150391,30.91281509399414,0.7260088920593262,0.7433886528015137,0.8325177431106567,754884,780031,44661,38551,525116,499969,18955,21978,18833,21931,"tensor([25722, 24878, 24303, 24489, 23527, 22443, 20402, 17709, 12734, 7503, 1792], device='cuda:0')","tensor([210, 230, 277, 328, 324, 297, 261, 190, 96, 31, 3], device='cuda:0')",20000,1922,4,39.44126129150391,18.217622756958008,0.0347470641136169,0.1231813728809356,0.22232386469841,34,127,1,13,1888,1795,0,0,0,0,"tensor([2, 2, 2, 4, 6, 3, 6, 4, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,39.44126129150391,24.461658477783203,0.899654746055603,0.911303162574768,0.933271825313568,558023,567165,24266,19331,100215,91073,0,0,0,0,"tensor([31836, 30485, 28906, 27529, 25469, 23104, 19777, 15832, 9662, 4080, 801], device='cuda:0')","tensor([ 54, 58, 74, 98, 106, 105, 112, 86, 62, 20, 4], device='cuda:0')",20000,392,3,39.44126129150391,24.461658477783203,0.9751243591308594,0.9961880445480348,0.9560975432395936,392,392,20,3,0,0,0,0,0,0,"tensor([22, 26, 27, 26, 21, 17, 17, 13, 7, 2, 0], device='cuda:0')","tensor([22, 26, 27, 26, 21, 17, 17, 13, 7, 2, 0], device='cuda:0')",20000,434590,4,39.44126129150391,18.217622756958008,0.5450332164764404,0.60060715675354,0.7256067395210266,166763,190806,10584,9981,267827,243784,0,0,0,0,"tensor([6203, 6079, 6141, 6603, 6539, 6374, 5931, 5278, 3840, 2266, 541], device='cuda:0')","tensor([34, 35, 40, 46, 41, 42, 43, 40, 24, 5, 0], device='cuda:0')",20000,7,0,39.44126129150391,39.44126129150391,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,39.44126129150391,39.44126129150391,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,0,39.44126129150391,39.44126129150391,0.8891186118125916,0.8891186118125916,0.9042433500289916,9029,9029,739,739,1513,1513,0,0,0,0,"tensor([402, 387, 388, 372, 346, 312, 279, 233, 184, 118, 28], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,0,39.44126129150391,39.44126129150391,0.8350750207901001,0.8350750207901001,0.8618890047073364,7871,7871,682,682,2427,2427,0,0,0,0,"tensor([385, 369, 370, 355, 334, 303, 269, 227, 179, 117, 28], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,0,39.44126129150391,39.44126129150391,0.8652154207229614,0.8652154207229614,0.892177164554596,8406,8406,700,700,1919,1919,0,0,0,0,"tensor([395, 382, 384, 369, 344, 309, 276, 233, 183, 118, 28], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,39.44126129150391,7.487692832946777,0.0,0.8800000548362732,0.8800000548362732,0,44,0,3,53,9,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,39.44126129150391,24.461658477783203,0.5714128613471985,0.6273874640464783,0.7414781451225281,182203,208111,11764,11549,261558,235650,0,0,0,0,"tensor([6918, 6706, 6688, 7026, 6904, 6698, 6185, 5457, 3949, 2300, 541], device='cuda:0')","tensor([32, 33, 45, 52, 47, 47, 45, 41, 24, 5, 0], device='cuda:0')",20000,0,0,39.44126129150391,39.44126129150391,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,39.44126129150391,18.217622756958008,0.1117511540651321,0.2204767167568206,0.3173516094684601,388,814,29,43,6139,5713,0,0,0,0,"tensor([13, 13, 13, 17, 24, 25, 21, 22, 20, 18, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,0,39.44126129150391,39.44126129150391,0.7823613286018372,0.7823613286018372,0.8171253204345703,9625,9625,769,769,4586,4586,0,0,0,0,"tensor([559, 541, 515, 496, 448, 409, 366, 305, 229, 130, 28], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,39.44126129150391,39.44126129150391,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,6,39.44126129150391,7.487692832946777,0.1078431382775306,0.5225564241409302,0.5888689160346985,22,139,1,8,363,246,0,0,0,0,"tensor([2, 3, 3, 1, 3, 2, 4, 2, 2, 1, 0], device='cuda:0')","tensor([2, 3, 3, 1, 3, 2, 4, 2, 2, 1, 0], device='cuda:0')",20000,18325,4,39.44126129150391,18.217622756958008,0.9617828130722046,0.9669537544250488,0.957019031047821,18321,18244,1452,1166,4,81,0,0,0,0,"tensor([1055, 1017, 956, 922, 860, 812, 695, 567, 355, 155, 28], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,4,39.44126129150391,18.217622756958008,0.0,0.0539661906659603,0.0539661906659603,0,83,0,5,2988,2905,0,0,0,0,"tensor([0, 0, 0, 0, 2, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,5,39.44126129150391,12.46676540374756,0.023204069584608,0.051314141601324,0.0919926613569259,73,164,1,10,6145,6054,0,0,0,0,"tensor([ 1, 1, 2, 3, 6, 8, 10, 10, 8, 3, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 22,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_22/,autoencoders/matryoshka_chess/trainer_22/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,53.27999877929688,44.19829940795898,1.4454305171966553,0.08544921875,0.9786109328269958,0.9806315302848816,0.9877928495407104,0.2971398532390594,0.304265409708023,3.4657371044158936,0.9977511763572692,7630,20000,1280000,3,67.90042877197266,29.615976333618164,0.6418352127075195,0.702315628528595,0.8115577697753906,626849,712423,46453,36360,653151,567577,9869,18723,9742,18415,"tensor([27168, 25703, 24698, 24677, 24352, 22713, 21225, 18469, 13358, 7405, 1633], device='cuda:0')","tensor([152, 167, 259, 391, 479, 505, 465, 401, 252, 80, 7], device='cuda:0')",20000,578762,3,67.90042877197266,29.615976333618164,0.6284792423248291,0.7426955103874207,0.8440088033676147,274576,349807,20441,13424,304186,228955,529,1627,518,1592,"tensor([11156, 10771, 10448, 10443, 10331, 9546, 8941, 7836, 5923, 3557, 810], device='cuda:0')","tensor([149, 163, 247, 377, 463, 485, 450, 389, 243, 74, 5], device='cuda:0')",20000,221620,4,67.90042877197266,21.369977951049805,0.3213899135589599,0.7012064456939697,0.8303667306900024,42759,120604,1709,1766,178861,101016,97,468,95,456,"tensor([ 484, 502, 659, 924, 1103, 1157, 1128, 983, 638, 302, 71], device='cuda:0')","tensor([149, 159, 243, 373, 460, 483, 449, 389, 243, 74, 5], device='cuda:0')",20000,1280000,2,67.90042877197266,41.01959991455078,0.7007288932800293,0.7465832829475403,0.8310068845748901,718704,787673,52600,42401,561296,492327,14762,24689,14647,24603,"tensor([28925, 27293, 26170, 26028, 25569, 23854, 22241, 19288, 13834, 7490, 1633], device='cuda:0')","tensor([139, 167, 258, 328, 339, 312, 262, 203, 118, 39, 3], device='cuda:0')",20000,1922,4,67.90042877197266,21.369977951049805,0.0165118686854839,0.2189512252807617,0.2334241569042205,16,238,0,14,1906,1684,0,0,0,0,"tensor([ 1, 1, 1, 3, 10, 8, 6, 2, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,2,67.90042877197266,41.01959991455078,0.8554198741912842,0.9059329628944396,0.931312620639801,508962,562824,22770,21467,149276,95414,0,0,0,0,"tensor([37953, 34339, 31294, 29358, 27394, 24595, 21465, 16928, 10369, 4074, 735], device='cuda:0')","tensor([ 54, 56, 78, 102, 115, 107, 106, 79, 45, 15, 4], device='cuda:0')",20000,392,2,67.90042877197266,41.01959991455078,0.897698163986206,0.9744898080825806,0.927639365196228,351,382,39,10,41,10,0,0,0,0,"tensor([26, 29, 29, 26, 22, 22, 17, 11, 7, 0, 0], device='cuda:0')","tensor([26, 29, 29, 26, 22, 22, 17, 11, 7, 0, 0], device='cuda:0')",20000,434590,3,67.90042877197266,29.615976333618164,0.5475361347198486,0.5815329551696777,0.7247751355171204,168461,182392,12291,10298,266129,252198,0,0,0,0,"tensor([6692, 6536, 6565, 6941, 7075, 6728, 6455, 5676, 4134, 2284, 500], device='cuda:0')","tensor([19, 21, 29, 43, 44, 37, 39, 29, 18, 10, 0], device='cuda:0')",20000,7,0,67.90042877197266,67.90042877197266,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,67.90042877197266,67.90042877197266,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,67.90042877197266,21.369977951049805,0.8841626048088074,0.963872253894806,0.9197022318840028,9125,10365,974,600,1417,177,0,0,0,0,"tensor([450, 441, 412, 391, 374, 327, 295, 248, 194, 117, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,6,67.90042877197266,8.632699966430664,0.8517683148384094,0.8917157649993896,0.9045897722244264,8309,8622,903,418,1989,1676,0,0,0,0,"tensor([429, 424, 394, 381, 364, 320, 286, 240, 188, 117, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,67.90042877197266,21.369977951049805,0.8629818558692932,0.9560351967811584,0.9199051856994628,8361,10166,691,776,1964,159,0,0,0,0,"tensor([444, 438, 408, 387, 373, 325, 295, 247, 194, 117, 25], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,7,67.90042877197266,3.772550582885742,0.0,0.6329113245010376,0.6329113245010376,0,25,0,1,53,28,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,67.90042877197266,29.615976333618164,0.5741158723831177,0.6120648384094238,0.7389723658561707,184005,200865,13237,11726,259756,242896,0,0,0,0,"tensor([7592, 7215, 7088, 7443, 7446, 7046, 6745, 5899, 4291, 2318, 501], device='cuda:0')","tensor([25, 27, 34, 48, 47, 44, 43, 34, 18, 10, 0], device='cuda:0')",20000,0,0,67.90042877197266,67.90042877197266,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,67.90042877197266,14.64547634124756,0.0969943329691886,0.2199565023183822,0.3309424817562103,334,809,26,20,6193,5718,0,0,0,0,"tensor([15, 14, 18, 28, 30, 30, 30, 28, 19, 20, 8], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,67.90042877197266,56.01319122314453,0.7919663786888123,0.7957336902618408,0.8326162099838257,10075,10072,1157,1032,4136,4139,0,0,0,0,"tensor([662, 627, 559, 520, 480, 437, 402, 354, 251, 131, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,67.90042877197266,67.90042877197266,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,3,67.90042877197266,29.615976333618164,0.2690582871437073,0.5162523984909058,0.588652491569519,60,135,1,3,325,250,0,0,0,0,"tensor([2, 2, 3, 4, 5, 3, 3, 3, 2, 2, 0], device='cuda:0')","tensor([2, 2, 3, 4, 5, 3, 3, 3, 2, 2, 0], device='cuda:0')",20000,18325,4,67.90042877197266,21.369977951049805,0.9568328261375428,0.9633051753044128,0.9563447833061218,18320,18245,1648,1310,5,80,0,0,0,0,"tensor([1251, 1138, 1040, 989, 928, 854, 752, 615, 385, 156, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,3,67.90042877197266,29.615976333618164,0.0,0.2454810440540313,0.2454810440540313,0,421,0,21,2988,2567,0,0,0,0,"tensor([0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,67.90042877197266,21.369977951049805,0.0089643020182847,0.0666253492236137,0.1151122450828552,28,215,1,21,6190,6003,0,0,0,0,"tensor([ 2, 2, 3, 6, 11, 10, 14, 9, 9, 5, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 23,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_23/,autoencoders/matryoshka_chess/trainer_23/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,75.23999786376953,51.57380294799805,1.3267871141433716,0.09716796875,0.9821213483810424,0.98383891582489,0.9910586476325988,0.2971398532390594,0.3046708106994629,3.4657371044158936,0.9976232647895812,7498,20000,1280000,3,93.43958282470705,31.87608528137207,0.6277143955230713,0.7049192786216736,0.8072109818458557,604934,716893,42484,37079,675066,563107,9051,18494,8926,18198,"tensor([24985, 25207, 24269, 23999, 23163, 21893, 20002, 17542, 13251, 7945, 1995], device='cuda:0')","tensor([138, 157, 233, 347, 448, 484, 446, 366, 217, 75, 12], device='cuda:0')",20000,578762,3,93.43958282470705,31.87608528137207,0.6079316735267639,0.7546074986457825,0.844366729259491,260444,359535,17614,14609,318318,219227,478,1830,455,1808,"tensor([10208, 10519, 10279, 10238, 9808, 9187, 8360, 7440, 5923, 3811, 992], device='cuda:0')","tensor([132, 149, 225, 338, 438, 469, 432, 350, 209, 70, 11], device='cuda:0')",20000,221620,4,93.43958282470705,22.20099639892578,0.2942111790180206,0.7045385837554932,0.8264017701148987,38489,121510,1533,1805,183131,100110,79,531,77,527,"tensor([ 434, 472, 646, 872, 1037, 1112, 1060, 891, 607, 315, 76], device='cuda:0')","tensor([132, 148, 219, 333, 435, 467, 431, 350, 209, 70, 11], device='cuda:0')",20000,1280000,2,93.43958282470705,46.01613998413086,0.6702471971511841,0.743659496307373,0.8270891308784485,668718,782998,46719,42799,611282,497002,12868,23298,12769,23223,"tensor([26553, 26710, 25662, 25269, 24326, 22983, 21005, 18334, 13725, 8061, 1996], device='cuda:0')","tensor([130, 161, 232, 278, 297, 281, 246, 189, 95, 33, 2], device='cuda:0')",20000,1922,5,93.43958282470705,14.417158126831056,0.0,0.1086637377738952,0.1672177463769912,0,111,0,10,1922,1811,0,0,0,0,"tensor([0, 0, 0, 3, 4, 6, 4, 3, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,93.43958282470705,31.87608528137207,0.8354478478431702,0.9005709290504456,0.9232358932495116,487191,555741,20870,20218,171047,102497,0,0,0,0,"tensor([36172, 33538, 30308, 28025, 25940, 23538, 20665, 16101, 10225, 4448, 868], device='cuda:0')","tensor([ 37, 44, 49, 77, 98, 103, 111, 76, 46, 14, 2], device='cuda:0')",20000,392,3,93.43958282470705,31.87608528137207,0.7433903813362122,0.9974424839019777,0.9300118684768676,239,390,12,0,153,2,0,0,0,0,"tensor([10, 16, 23, 26, 23, 19, 17, 14, 7, 0, 0], device='cuda:0')","tensor([10, 16, 23, 26, 23, 19, 17, 14, 7, 0, 0], device='cuda:0')",20000,434590,3,93.43958282470705,31.87608528137207,0.5342381596565247,0.571298360824585,0.7128032445907593,162566,177952,11434,10432,272024,256638,0,0,0,0,"tensor([6274, 6440, 6571, 6739, 6843, 6572, 6008, 5374, 4072, 2439, 592], device='cuda:0')","tensor([20, 23, 32, 32, 36, 33, 38, 35, 24, 5, 0], device='cuda:0')",20000,7,0,93.43958282470705,93.43958282470705,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,93.43958282470705,93.43958282470705,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,93.43958282470705,22.20099639892578,0.8892408013343811,0.9723633527755736,0.9274722933769226,8984,10432,680,483,1558,110,0,0,0,0,"tensor([400, 417, 390, 377, 340, 302, 261, 236, 189, 126, 30], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,6,93.43958282470705,8.07957649230957,0.8435259461402893,0.9079114198684692,0.9144757986068726,8000,8957,670,476,2298,1341,0,0,0,0,"tensor([388, 404, 379, 366, 330, 291, 255, 227, 187, 126, 30], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,93.43958282470705,22.20099639892578,0.8535600304603577,0.9634547829627992,0.9214186668395996,8134,10229,600,680,2191,96,0,0,0,0,"tensor([394, 410, 384, 369, 337, 301, 259, 236, 189, 126, 30], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,93.43958282470705,8.07957649230957,0.0,0.8333333134651184,0.8333333134651184,0,40,0,3,53,13,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,3,93.43958282470705,31.87608528137207,0.5638470649719238,0.599679708480835,0.7322741746902466,179128,194868,12489,11278,264633,248893,0,0,0,0,"tensor([7103, 7160, 7079, 7178, 7216, 6865, 6257, 5563, 4190, 2472, 592], device='cuda:0')","tensor([23, 26, 36, 38, 39, 36, 40, 39, 24, 5, 0], device='cuda:0')",20000,0,0,93.43958282470705,93.43958282470705,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,93.43958282470705,31.87608528137207,0.086626797914505,0.1786855608224868,0.3227680027484894,297,643,33,27,6230,5884,0,0,0,0,"tensor([11, 12, 20, 21, 20, 23, 24, 27, 24, 19, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,93.43958282470705,68.53560638427734,0.7860493063926697,0.7891291975975037,0.8305139541625977,9804,9887,930,960,4407,4324,0,0,0,0,"tensor([588, 592, 549, 502, 459, 416, 366, 323, 248, 141, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,93.43958282470705,93.43958282470705,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,93.43958282470705,14.417158126831056,0.0,0.4581673145294189,0.5233644843101501,0,115,0,2,385,270,0,0,0,0,"tensor([0, 1, 1, 4, 2, 3, 5, 3, 1, 0, 0], device='cuda:0')","tensor([0, 1, 1, 4, 2, 3, 5, 3, 1, 0, 0], device='cuda:0')",20000,18325,4,93.43958282470705,22.20099639892578,0.957116723060608,0.9622085690498352,0.9563447833061218,18324,18281,1641,1392,1,44,0,0,0,0,"tensor([1111, 1075, 999, 931, 884, 821, 727, 572, 376, 172, 32], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,3,93.43958282470705,31.87608528137207,0.0,0.3436051309108734,0.3436051309108734,0,630,0,49,2988,2358,0,0,0,0,"tensor([0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,93.43958282470705,8.07957649230957,0.007370613515377,0.052895151078701,0.0776938498020172,23,169,0,3,6195,6049,0,0,0,0,"tensor([1, 1, 2, 5, 6, 6, 8, 9, 8, 3, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 24,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_24/,autoencoders/matryoshka_chess/trainer_24/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,99.0,60.51531600952149,1.2662074565887451,0.098876953125,0.9838665127754213,0.9855208992958068,0.9940615892410278,0.2971398532390594,0.30583456158638,3.4657371044158936,0.9972559809684752,7174,20000,1280000,3,122.67159271240234,32.60905456542969,0.6191109418869019,0.6869203448295593,0.7952708601951599,590986,688311,38158,35738,689014,591689,8339,16956,8239,16709,"tensor([23992, 24161, 23415, 21973, 21573, 20586, 18879, 16787, 12451, 7178, 1980], device='cuda:0')","tensor([144, 147, 214, 331, 421, 428, 412, 357, 222, 65, 7], device='cuda:0')",20000,578762,3,122.67159271240234,32.60905456542969,0.6000874638557434,0.7318328619003296,0.832137405872345,254534,341991,15027,13862,324228,236771,721,1754,696,1733,"tensor([10170, 10344, 10115, 9441, 9212, 8752, 7938, 7131, 5451, 3466, 987], device='cuda:0')","tensor([140, 143, 209, 322, 410, 413, 399, 343, 214, 58, 5], device='cuda:0')",20000,221620,4,122.67159271240234,21.6458797454834,0.305912435054779,0.6853649020195007,0.8056058287620544,40311,116389,1615,1632,181309,105231,85,509,81,504,"tensor([ 462, 472, 625, 833, 994, 1019, 988, 862, 593, 286, 82], device='cuda:0')","tensor([140, 142, 205, 318, 406, 412, 399, 343, 214, 58, 5], device='cuda:0')",20000,1280000,2,122.67159271240234,50.29164123535156,0.6519441604614258,0.7378374934196472,0.8207448124885559,638992,772244,41274,41019,641008,507756,11144,22002,11088,21936,"tensor([25329, 25509, 24675, 23118, 22628, 21570, 19785, 17554, 12896, 7268, 1980], device='cuda:0')","tensor([114, 143, 219, 268, 278, 264, 228, 180, 103, 28, 3], device='cuda:0')",20000,1922,3,122.67159271240234,32.60905456542969,0.0185471419245004,0.0643863230943679,0.1271844655275344,18,64,1,2,1904,1858,0,0,0,0,"tensor([1, 1, 1, 3, 3, 4, 4, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,122.67159271240234,32.60905456542969,0.7581568360328674,0.8971025943756104,0.8655561208724976,413567,551004,19175,19166,244671,107234,0,0,0,0,"tensor([33414, 31351, 28660, 26105, 24254, 22287, 19189, 15555, 9664, 3946, 869], device='cuda:0')","tensor([ 42, 43, 61, 85, 117, 95, 83, 75, 46, 10, 2], device='cuda:0')",20000,392,3,122.67159271240234,32.60905456542969,0.7255216836929321,0.9987261295318604,0.9714993834495544,226,392,5,1,166,0,0,0,0,0,"tensor([13, 15, 20, 20, 21, 18, 17, 9, 7, 0, 0], device='cuda:0')","tensor([13, 15, 20, 20, 21, 18, 17, 9, 7, 0, 0], device='cuda:0')",20000,434590,3,122.67159271240234,32.60905456542969,0.5385169982910156,0.5733206868171692,0.7022591233253479,163906,178731,10235,10173,270684,255859,0,0,0,0,"tensor([6205, 6298, 6368, 6238, 6377, 6142, 5689, 5170, 3863, 2159, 595], device='cuda:0')","tensor([14, 14, 19, 29, 28, 33, 30, 26, 19, 5, 0], device='cuda:0')",20000,7,0,122.67159271240234,122.67159271240234,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,122.67159271240234,122.67159271240234,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,122.67159271240234,32.60905456542969,0.8552106022834778,0.963440477848053,0.9176964163780212,8346,10462,630,714,2196,80,0,0,0,0,"tensor([417, 426, 393, 353, 339, 303, 264, 221, 171, 113, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,122.67159271240234,32.60905456542969,0.7967668771743774,0.8148473501205444,0.8651092052459717,7196,7409,569,478,3102,2889,0,0,0,0,"tensor([403, 414, 381, 343, 324, 293, 257, 216, 168, 113, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,122.67159271240234,21.6458797454834,0.8575899600982666,0.9275279641151428,0.90618097782135,8220,9778,625,981,2105,547,0,0,0,0,"tensor([416, 424, 388, 348, 335, 300, 263, 219, 171, 113, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,7,122.67159271240234,3.378822326660156,0.0,0.7415730357170105,0.7415730357170105,0,33,0,3,53,20,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0], device='cuda:0')",20000,443761,2,122.67159271240234,50.29164123535156,0.5652986764907837,0.5919324159622192,0.7220829725265503,179328,191552,11365,11896,264433,252209,0,0,0,0,"tensor([6855, 6894, 6857, 6603, 6728, 6400, 5914, 5342, 3977, 2178, 595], device='cuda:0')","tensor([18, 18, 25, 28, 32, 34, 29, 26, 19, 5, 0], device='cuda:0')",20000,0,0,122.67159271240234,122.67159271240234,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,2,122.67159271240234,50.29164123535156,0.2029859125614166,0.2270518392324447,0.3488111495971679,741,841,33,40,5786,5686,0,0,0,0,"tensor([14, 13, 16, 18, 25, 28, 27, 24, 21, 19, 8], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,2,122.67159271240234,50.29164123535156,0.7635974884033203,0.7689462304115295,0.8209090828895569,9301,9355,849,766,4910,4856,0,0,0,0,"tensor([551, 553, 517, 463, 435, 395, 349, 315, 222, 125, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,122.67159271240234,122.67159271240234,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,6,122.67159271240234,7.522722721099853,0.0455696210265159,0.4823529124259949,0.5776965022087097,9,123,1,2,376,262,0,0,0,0,"tensor([1, 1, 0, 3, 3, 4, 5, 3, 2, 1, 0], device='cuda:0')","tensor([1, 1, 0, 3, 3, 4, 5, 3, 2, 1, 0], device='cuda:0')",20000,18325,4,122.67159271240234,21.6458797454834,0.9573355317115784,0.9614907503128052,0.9562948346138,18310,18189,1617,1321,15,136,0,0,0,0,"tensor([1016, 1001, 922, 856, 796, 755, 661, 563, 353, 149, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,3,122.67159271240234,32.60905456542969,0.0,0.3588633239269256,0.3588633239269256,0,663,0,44,2988,2325,0,0,0,0,"tensor([0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,122.67159271240234,7.522722721099853,0.0197106972336769,0.0673912987112999,0.1215768903493881,62,217,11,5,6156,6001,0,0,0,0,"tensor([ 3, 3, 3, 7, 9, 6, 12, 9, 6, 3, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 25,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_25/,autoencoders/matryoshka_chess/trainer_25/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,120.55999755859376,68.23088073730469,1.2384333610534668,0.093017578125,0.9847227334976196,0.9866156578063964,0.9945690631866456,0.2971398532390594,0.3011469542980194,3.4657371044158936,0.9987353682518004,6668,20000,1280000,4,150.03372192382812,21.013246536254883,0.5901918411254883,0.6644887328147888,0.7829368114471436,549712,651392,33113,29189,730288,628608,8027,12484,7918,12359,"tensor([23262, 22903, 21263, 20645, 20126, 18625, 17524, 15205, 11035, 6317, 1716], device='cuda:0')","tensor([147, 149, 214, 320, 353, 373, 379, 316, 202, 56, 7], device='cuda:0')",20000,578762,3,150.03372192382812,33.855316162109375,0.5662063360214233,0.7083566188812256,0.8240088224411011,233756,324291,13174,12562,345006,254471,669,1474,640,1467,"tensor([10066, 9868, 9243, 8969, 8705, 7955, 7455, 6518, 4876, 3046, 849], device='cuda:0')","tensor([145, 147, 209, 312, 340, 362, 367, 303, 193, 51, 6], device='cuda:0')",20000,221620,4,150.03372192382812,21.013246536254883,0.2607400417327881,0.6235765814781189,0.7997939586639404,33430,101006,1374,1331,188190,120614,57,385,57,382,"tensor([500, 532, 610, 817, 906, 949, 920, 784, 555, 262, 71], device='cuda:0')","tensor([145, 146, 205, 309, 338, 361, 367, 303, 193, 51, 6], device='cuda:0')",20000,1280000,2,150.03372192382812,56.04344940185547,0.6212394833564758,0.7115893363952637,0.8099005818367004,592746,727023,35523,36355,687254,552977,10368,18091,10343,18038,"tensor([24498, 24120, 22318, 21628, 21035, 19472, 18339, 15896, 11445, 6395, 1716], device='cuda:0')","tensor([130, 152, 213, 252, 237, 224, 203, 160, 89, 25, 2], device='cuda:0')",20000,1922,5,150.03372192382812,12.681163787841797,0.0387162454426288,0.0967423543334007,0.153036817908287,38,98,3,6,1884,1824,0,0,0,0,"tensor([2, 2, 2, 2, 1, 5, 4, 4, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,150.03372192382812,33.855316162109375,0.6422385573387146,0.8833078145980835,0.7709549069404602,318690,535781,15507,19105,339548,122457,0,0,0,0,"tensor([30293, 28476, 25580, 23713, 21984, 19739, 17567, 13921, 8581, 3404, 770], device='cuda:0')","tensor([35, 35, 56, 73, 77, 78, 75, 61, 44, 9, 2], device='cuda:0')",20000,392,3,150.03372192382812,33.855316162109375,0.8583691120147705,0.996178388595581,0.9800000190734864,300,391,7,2,92,1,0,0,0,0,"tensor([19, 19, 20, 20, 14, 13, 8, 7, 5, 1, 0], device='cuda:0')","tensor([19, 19, 20, 20, 14, 13, 8, 7, 5, 1, 0], device='cuda:0')",20000,434590,3,150.03372192382812,33.855316162109375,0.5292176008224487,0.5432759523391724,0.6886855959892273,160037,165377,10179,8847,274553,269213,0,0,0,0,"tensor([6304, 6189, 5929, 5894, 5995, 5673, 5375, 4676, 3466, 1904, 510], device='cuda:0')","tensor([12, 11, 21, 27, 31, 34, 35, 29, 14, 3, 0], device='cuda:0')",20000,7,0,150.03372192382812,150.03372192382812,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,150.03372192382812,150.03372192382812,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,2,150.03372192382812,56.04344940185547,0.850524365901947,0.8687759637832642,0.8857263326644897,8151,8567,474,613,2391,1975,0,0,0,0,"tensor([401, 391, 360, 333, 301, 256, 235, 195, 158, 102, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,150.03372192382812,96.82791900634766,0.7981420159339905,0.8041157126426697,0.8478654623031616,7131,7307,440,569,3167,2991,0,0,0,0,"tensor([390, 380, 350, 323, 290, 252, 229, 192, 155, 100, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,1,150.03372192382812,96.82791900634766,0.8326486945152283,0.8355091214179993,0.8714369535446167,7702,7840,473,602,2623,2485,0,0,0,0,"tensor([398, 388, 355, 328, 299, 254, 233, 194, 158, 101, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,150.03372192382812,6.701959133148193,0.0,0.7956989407539368,0.7956989407539368,0,37,0,3,53,16,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,4,150.03372192382812,21.013246536254883,0.5450935959815979,0.5690000653266907,0.7021014094352722,170248,180012,10647,8958,273513,263749,0,0,0,0,"tensor([6690, 6629, 6274, 6272, 6300, 5913, 5561, 4830, 3544, 1932, 510], device='cuda:0')","tensor([15, 14, 23, 30, 37, 34, 34, 29, 14, 3, 0], device='cuda:0')",20000,0,0,150.03372192382812,150.03372192382812,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,150.03372192382812,21.013246536254883,0.1655730903148651,0.1995060443878173,0.3278233706951141,593,727,43,34,5934,5800,0,0,0,0,"tensor([19, 21, 21, 26, 32, 31, 30, 26, 19, 18, 11], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,150.03372192382812,96.82791900634766,0.7339465022087097,0.7455965876579285,0.8281008005142212,8538,8826,517,638,5673,5385,0,0,0,0,"tensor([512, 503, 454, 417, 390, 354, 321, 276, 194, 109, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,150.03372192382812,150.03372192382812,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,150.03372192382812,12.681163787841797,0.1578947305679321,0.4627451300621032,0.5729729533195496,33,118,0,7,352,267,0,0,0,0,"tensor([1, 2, 2, 2, 2, 3, 3, 3, 3, 1, 0], device='cuda:0')","tensor([1, 2, 2, 2, 2, 3, 3, 3, 3, 1, 0], device='cuda:0')",20000,18325,4,150.03372192382812,21.013246536254883,0.9565514922142028,0.9603241682052612,0.9562948346138,18119,18250,1440,1433,206,75,0,0,0,0,"tensor([886, 888, 802, 752, 711, 656, 611, 509, 330, 128, 27], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,150.03372192382812,150.03372192382812,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,6,150.03372192382812,6.701959133148193,0.0038504730910062,0.0378489233553409,0.0749075263738632,12,120,3,3,6206,6098,0,0,0,0,"tensor([1, 2, 2, 5, 6, 7, 7, 6, 5, 3, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 26,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_26/,autoencoders/matryoshka_chess/trainer_26/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,147.75999450683594,78.40619659423828,1.135991454124451,0.095703125,0.987028181552887,0.9886846542358398,0.9965290427207948,0.2971398532390594,0.300556480884552,3.4657371044158936,0.9989217519760132,6137,20000,1280000,3,177.46226501464844,37.72628402709961,0.575646698474884,0.6411548852920532,0.759188175201416,528444,617502,27557,28716,751556,662498,6788,11927,6715,11769,"tensor([20875, 20907, 19665, 19214, 18270, 17405, 16903, 15096, 11064, 6660, 1980], device='cuda:0')","tensor([182, 189, 229, 307, 348, 346, 324, 267, 173, 50, 9], device='cuda:0')",20000,578762,4,177.46226501464844,22.74061584472656,0.5559315085411072,0.6811251044273376,0.7920534014701843,226832,304027,10449,9931,351930,274735,417,812,412,811,"tensor([9115, 9049, 8633, 8437, 7939, 7449, 7247, 6550, 4997, 3227, 986], device='cuda:0')","tensor([174, 180, 221, 296, 340, 336, 315, 258, 163, 44, 6], device='cuda:0')",20000,221620,4,177.46226501464844,22.74061584472656,0.2788950502872467,0.6024734973907471,0.7495589852333069,36119,96087,1276,1268,185501,125533,75,351,74,350,"tensor([573, 576, 652, 796, 881, 869, 862, 739, 506, 256, 82], device='cuda:0')","tensor([174, 180, 218, 292, 337, 334, 315, 258, 163, 44, 6], device='cuda:0')",20000,1280000,3,177.46226501464844,37.72628402709961,0.6009732484817505,0.6898259520530701,0.7917348742485046,562446,689688,29338,29912,717554,590312,8442,15829,8430,15801,"tensor([21926, 21998, 20596, 20053, 19089, 18192, 17678, 15695, 11404, 6724, 1980], device='cuda:0')","tensor([146, 165, 194, 222, 216, 205, 174, 135, 87, 19, 3], device='cuda:0')",20000,1922,5,177.46226501464844,12.983430862426758,0.0337595902383327,0.1032956168055534,0.1769411712884903,33,105,0,6,1889,1817,0,0,0,0,"tensor([1, 1, 1, 2, 3, 4, 5, 4, 2, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,177.46226501464844,37.72628402709961,0.5816655158996582,0.8776938319206238,0.7203654050827026,275464,529094,13454,18314,382774,129144,0,0,0,0,"tensor([27262, 25986, 23332, 21859, 20183, 18581, 16482, 12865, 7950, 3441, 875], device='cuda:0')","tensor([42, 44, 52, 62, 64, 68, 69, 51, 34, 9, 2], device='cuda:0')",20000,392,3,177.46226501464844,37.72628402709961,0.8012048006057739,0.9987229108810424,0.9727047681808472,266,391,6,0,126,1,0,0,0,0,"tensor([13, 13, 17, 16, 14, 13, 12, 8, 5, 1, 0], device='cuda:0')","tensor([13, 13, 17, 16, 14, 13, 12, 8, 5, 1, 0], device='cuda:0')",20000,434590,3,177.46226501464844,37.72628402709961,0.5204265117645264,0.5310378074645996,0.6663325428962708,155817,160144,8398,8402,278773,274446,0,0,0,0,"tensor([5786, 5716, 5579, 5659, 5590, 5348, 5188, 4674, 3389, 2017, 578], device='cuda:0')","tensor([22, 23, 25, 29, 30, 26, 21, 22, 16, 5, 0], device='cuda:0')",20000,7,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,177.46226501464844,37.72628402709961,0.8157323002815247,0.9648117423057556,0.9322776198387146,7508,10186,358,387,3034,356,0,0,0,0,"tensor([341, 340, 324, 299, 274, 248, 233, 203, 159, 107, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,177.46226501464844,37.72628402709961,0.7886554002761841,0.9385746717453004,0.9264212250709534,6924,9443,337,381,3374,855,0,0,0,0,"tensor([331, 329, 311, 292, 267, 242, 226, 199, 156, 107, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,177.46226501464844,37.72628402709961,0.7960748672485352,0.9468016624450684,0.9279139637947084,7058,9584,349,336,3267,741,0,0,0,0,"tensor([337, 336, 317, 297, 274, 246, 232, 203, 159, 107, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,2,177.46226501464844,63.359466552734375,0.538964569568634,0.5543190240859985,0.6815083622932434,167110,173909,9244,9799,276651,269852,0,0,0,0,"tensor([6091, 6098, 5852, 5905, 5815, 5572, 5404, 4845, 3484, 2036, 578], device='cuda:0')","tensor([25, 26, 25, 28, 30, 26, 20, 22, 16, 6, 0], device='cuda:0')",20000,0,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,177.46226501464844,12.983430862426758,0.1570282876491546,0.2038861662149429,0.2982051372528076,558,745,22,36,5969,5782,0,0,0,0,"tensor([12, 11, 15, 23, 25, 30, 29, 25, 24, 20, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,177.46226501464844,109.73014831542967,0.7117882966995239,0.715249240398407,0.814017117023468,8082,8166,416,457,6129,6045,0,0,0,0,"tensor([456, 454, 419, 392, 357, 317, 315, 277, 209, 112, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,7,177.46226501464844,2.601357698440552,0.0,0.2964601516723633,0.4204081296920776,0,67,0,0,385,318,0,0,0,0,"tensor([0, 0, 1, 2, 1, 1, 1, 2, 3, 0, 0], device='cuda:0')","tensor([0, 0, 1, 2, 1, 1, 1, 2, 3, 0, 0], device='cuda:0')",20000,18325,4,177.46226501464844,22.74061584472656,0.9552127122879028,0.9594064950942992,0.9562948346138,17862,18234,1212,1452,463,91,0,0,0,0,"tensor([763, 792, 704, 670, 650, 612, 581, 473, 296, 132, 31], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,177.46226501464844,177.46226501464844,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,7,177.46226501464844,2.601357698440552,0.0076873796060681,0.0449544191360473,0.07986431568861,24,143,2,1,6194,6075,0,0,0,0,"tensor([3, 3, 3, 8, 8, 7, 6, 9, 4, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 27,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_27/,autoencoders/matryoshka_chess/trainer_27/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,168.9199981689453,86.60303497314453,1.0624375343322754,0.093505859375,0.9888317584991456,0.9906690716743468,0.997834324836731,0.2971398532390594,0.3005910813808441,3.4657371044158936,0.9989108443260192,5420,20000,1280000,3,209.24620056152344,39.10197448730469,0.5396189093589783,0.6048499345779419,0.7372279167175293,481390,565571,22795,24549,798610,714429,5391,9162,5353,9004,"tensor([17811, 18084, 17294, 16163, 16051, 15071, 14425, 12293, 8768, 5590, 1662], device='cuda:0')","tensor([157, 161, 186, 239, 272, 278, 258, 214, 126, 36, 5], device='cuda:0')",20000,578762,3,209.24620056152344,39.10197448730469,0.5183926820755005,0.6472002863883972,0.7801350355148315,205530,281503,8659,9645,373232,297259,301,972,292,969,"tensor([7929, 7951, 7664, 7161, 7096, 6525, 6225, 5404, 3998, 2722, 825], device='cuda:0')","tensor([151, 155, 179, 231, 263, 271, 249, 205, 121, 31, 3], device='cuda:0')",20000,221620,4,209.24620056152344,21.98604393005371,0.2231439054012298,0.5860040187835693,0.7251465916633606,27950,92276,941,1037,193670,129344,63,214,61,214,"tensor([505, 495, 557, 640, 725, 711, 698, 579, 400, 210, 63], device='cuda:0')","tensor([151, 153, 178, 229, 262, 269, 249, 205, 121, 31, 3], device='cuda:0')",20000,1280000,2,209.24620056152344,70.66311645507812,0.5606698393821716,0.664579451084137,0.7729752659797668,508003,652086,24126,30316,771997,627914,6115,12595,6112,12564,"tensor([18566, 18917, 18053, 16833, 16685, 15710, 15044, 12784, 9010, 5644, 1662], device='cuda:0')","tensor([112, 122, 153, 166, 162, 152, 138, 110, 53, 16, 2], device='cuda:0')",20000,1922,2,209.24620056152344,70.66311645507812,0.1017612591385841,0.1228834018111229,0.1891891956329345,104,127,18,18,1818,1795,0,0,0,0,"tensor([1, 1, 2, 1, 3, 3, 3, 3, 1, 0, 0], device='cuda:0')","tensor([1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,209.24620056152344,39.10197448730469,0.555079996585846,0.8594214916229248,0.6922053098678589,257702,509016,12582,17301,400536,149222,0,0,0,0,"tensor([23284, 22288, 20159, 18423, 17336, 15815, 13903, 10414, 6064, 2822, 716], device='cuda:0')","tensor([51, 49, 43, 56, 56, 53, 52, 51, 25, 9, 2], device='cuda:0')",20000,392,3,209.24620056152344,39.10197448730469,0.7590551376342773,0.9420654773712158,0.9422110319137572,241,374,2,28,151,18,0,0,0,0,"tensor([11, 11, 11, 16, 13, 13, 10, 9, 5, 1, 0], device='cuda:0')","tensor([11, 11, 11, 16, 13, 13, 10, 9, 5, 1, 0], device='cuda:0')",20000,434590,2,209.24620056152344,70.66311645507812,0.4841128289699554,0.4949504435062408,0.6330334544181824,140925,145460,6684,7726,293665,289130,0,0,0,0,"tensor([5067, 5010, 5018, 4856, 4926, 4588, 4405, 3728, 2707, 1720, 488], device='cuda:0')","tensor([17, 17, 20, 21, 19, 17, 18, 16, 11, 4, 0], device='cuda:0')",20000,7,0,209.24620056152344,209.24620056152344,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,209.24620056152344,209.24620056152344,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,209.24620056152344,11.954604148864746,0.7549286484718323,0.9319085478782654,0.9198338985443116,6529,9724,226,603,4013,818,0,0,0,0,"tensor([299, 302, 291, 261, 245, 224, 204, 174, 129, 90, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,6,209.24620056152344,5.638350009918213,0.7424405813217163,0.842695415019989,0.8790125846862793,6212,7741,224,333,4086,2557,0,0,0,0,"tensor([293, 297, 287, 260, 244, 221, 202, 171, 126, 90, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,6,209.24620056152344,5.638350009918213,0.7484123706817627,0.8468761444091797,0.8882076740264893,6305,7801,219,297,4020,2524,0,0,0,0,"tensor([297, 299, 289, 259, 244, 221, 204, 174, 129, 90, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,8,209.24620056152344,0.9024306535720824,0.0,0.3939394056797027,0.3939394056797027,0,13,0,0,53,40,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')",20000,443761,2,209.24620056152344,70.66311645507812,0.4992185533046722,0.5179296731948853,0.6488246321678162,150129,158040,7566,8475,293632,285721,0,0,0,0,"tensor([5242, 5328, 5229, 5025, 5099, 4799, 4620, 3886, 2787, 1728, 488], device='cuda:0')","tensor([16, 16, 19, 19, 19, 17, 18, 16, 12, 4, 0], device='cuda:0')",20000,0,0,209.24620056152344,209.24620056152344,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,209.24620056152344,21.98604393005371,0.098198726773262,0.1300998479127884,0.2139951288700103,338,456,19,27,6189,6071,0,0,0,0,"tensor([12, 9, 11, 16, 22, 20, 23, 20, 18, 15, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,1,209.24620056152344,127.13265228271484,0.6797564029693604,0.7022545337677002,0.8020559549331665,7478,8005,313,582,6733,6206,0,0,0,0,"tensor([376, 386, 363, 311, 304, 275, 254, 220, 159, 97, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,209.24620056152344,209.24620056152344,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,5,209.24620056152344,11.954604148864746,0.0985221713781356,0.3815513849258423,0.550561785697937,20,91,1,1,365,294,0,0,0,0,"tensor([2, 2, 2, 3, 2, 2, 3, 3, 1, 1, 0], device='cuda:0')","tensor([2, 2, 2, 3, 2, 2, 3, 3, 1, 1, 0], device='cuda:0')",20000,18325,3,209.24620056152344,39.10197448730469,0.9347127676010132,0.9576976895332336,0.9563447833061218,17166,18236,1239,1522,1159,89,0,0,0,0,"tensor([613, 647, 595, 540, 538, 512, 475, 386, 227, 109, 26], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,209.24620056152344,209.24620056152344,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,3,209.24620056152344,39.10197448730469,0.0105583108961582,0.042138360440731,0.0718155056238174,33,134,0,8,6185,6084,0,0,0,0,"tensor([3, 3, 4, 7, 9, 7, 6, 3, 3, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 28,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_28/,autoencoders/matryoshka_chess/trainer_28/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,189.9199981689453,100.08565521240234,0.9979447722434998,0.09375,0.990258514881134,0.9919425249099731,0.9977885484695436,0.2971398532390594,0.3009804785251617,3.4657371044158936,0.9987878799438475,4541,20000,1280000,3,237.9888153076172,43.16281509399414,0.5007963180541992,0.5554195642471313,0.6898494362831116,433458,500753,17617,22399,846542,779247,3073,5366,3057,5293,"tensor([13878, 14499, 13963, 13336, 12537, 12439, 11745, 10388, 7383, 4826, 1280], device='cuda:0')","tensor([117, 120, 133, 162, 178, 189, 169, 155, 81, 30, 5], device='cuda:0')",20000,578762,3,237.9888153076172,43.16281509399414,0.4736703932285309,0.5744412541389465,0.7168382406234741,181515,236789,6142,8864,397247,341973,167,471,161,467,"tensor([6230, 6429, 6277, 5976, 5525, 5405, 5084, 4510, 3362, 2329, 636], device='cuda:0')","tensor([112, 115, 127, 156, 172, 181, 165, 149, 79, 27, 4], device='cuda:0')",20000,221620,4,237.9888153076172,23.83254814147949,0.1730168461799621,0.462470531463623,0.6262403726577759,21052,66944,680,942,200568,154676,36,203,35,202,"tensor([411, 416, 453, 511, 547, 562, 531, 474, 313, 192, 53], device='cuda:0')","tensor([112, 115, 127, 154, 170, 179, 164, 149, 79, 27, 4], device='cuda:0')",20000,1280000,2,237.9888153076172,79.67471313476562,0.5192328691482544,0.60788494348526,0.7317911982536316,455375,569490,18655,24187,824625,710510,3376,7752,3375,7743,"tensor([14453, 15121, 14534, 13823, 13045, 12913, 12244, 10791, 7587, 4874, 1280], device='cuda:0')","tensor([ 85, 90, 104, 119, 112, 107, 92, 82, 36, 12, 1], device='cuda:0')",20000,1922,7,237.9888153076172,2.329587459564209,0.0,0.0377743765711784,0.0643539503216743,0,37,0,0,1922,1885,0,0,0,0,"tensor([0, 0, 0, 2, 2, 1, 2, 3, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,237.9888153076172,43.16281509399414,0.5778189301490784,0.8329300880432129,0.6902800798416138,272346,481606,12085,16570,385892,176632,0,0,0,0,"tensor([19659, 18966, 16948, 15566, 14438, 13340, 11552, 8921, 5078, 2516, 572], device='cuda:0')","tensor([68, 39, 38, 21, 31, 37, 36, 42, 18, 7, 2], device='cuda:0')",20000,392,5,237.9888153076172,12.634196281433104,0.5290806889533997,0.7796101570129395,0.8342857360839844,141,260,0,15,251,132,0,0,0,0,"tensor([6, 6, 6, 5, 5, 7, 6, 4, 1, 0, 0], device='cuda:0')","tensor([6, 6, 6, 5, 5, 7, 6, 4, 1, 0, 0], device='cuda:0')",20000,434590,2,237.9888153076172,79.67471313476562,0.4420219659805298,0.4680204093456268,0.6026066541671753,124726,134770,5027,6555,309864,299820,0,0,0,0,"tensor([4013, 4082, 4104, 4037, 3841, 3777, 3547, 3138, 2229, 1460, 385], device='cuda:0')","tensor([ 9, 9, 11, 12, 15, 16, 10, 14, 5, 2, 0], device='cuda:0')",20000,7,0,237.9888153076172,237.9888153076172,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,237.9888153076172,237.9888153076172,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,2,237.9888153076172,79.67471313476562,0.6971171498298645,0.7864621877670288,0.8724534511566162,5731,6948,169,179,4811,3594,0,0,0,0,"tensor([226, 234, 222, 206, 183, 171, 161, 138, 105, 78, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,2,237.9888153076172,79.67471313476562,0.6899530291557312,0.782990574836731,0.8451013565063477,5511,6776,166,234,4787,3522,0,0,0,0,"tensor([219, 226, 217, 204, 180, 169, 157, 134, 105, 77, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,2,237.9888153076172,79.67471313476562,0.700402557849884,0.7923076152801514,0.8716246485710144,5654,6901,166,194,4671,3424,0,0,0,0,"tensor([225, 233, 221, 205, 183, 170, 159, 138, 104, 77, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,237.9888153076172,5.921726703643799,0.0,0.5128205418586731,0.5128205418586731,0,20,0,5,53,33,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0], device='cuda:0')",20000,443761,3,237.9888153076172,43.16281509399414,0.4541198313236236,0.4993244707584381,0.6279360055923462,132056,150059,5774,7228,311705,293702,0,0,0,0,"tensor([4115, 4286, 4243, 4172, 4013, 3946, 3766, 3292, 2303, 1476, 385], device='cuda:0')","tensor([ 8, 8, 9, 10, 14, 17, 10, 14, 5, 3, 0], device='cuda:0')",20000,0,0,237.9888153076172,237.9888153076172,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,237.9888153076172,43.16281509399414,0.0994041487574577,0.1512415409088134,0.2072158008813858,342,536,12,25,6185,5991,0,0,0,0,"tensor([ 9, 9, 14, 20, 20, 22, 27, 25, 17, 18, 8], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,2,237.9888153076172,79.67471313476562,0.6474907398223877,0.7178072929382324,0.7867228388786316,6922,8197,248,431,7289,6014,0,0,0,0,"tensor([291, 300, 281, 264, 229, 223, 212, 182, 135, 84, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,237.9888153076172,237.9888153076172,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,4,237.9888153076172,23.83254814147949,0.2516853511333465,0.4171779155731201,0.5283019542694092,56,102,4,2,329,283,0,0,0,0,"tensor([2, 2, 3, 2, 4, 4, 3, 2, 1, 0, 0], device='cuda:0')","tensor([2, 2, 3, 2, 4, 4, 3, 2, 1, 0, 0], device='cuda:0')",20000,18325,3,237.9888153076172,43.16281509399414,0.9353171586990356,0.9578417539596558,0.9563198089599608,17099,18267,1139,1550,1226,58,0,0,0,0,"tensor([458, 496, 454, 438, 415, 431, 397, 322, 189, 92, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,237.9888153076172,237.9888153076172,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,237.9888153076172,23.83254814147949,0.0153085626661777,0.0452190339565277,0.0744516476988792,48,144,5,7,6170,6074,0,0,0,0,"tensor([4, 4, 3, 3, 7, 7, 7, 7, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 29,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_29/,autoencoders/matryoshka_chess/trainer_29/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,208.9199981689453,109.62589263916016,0.9402374029159546,0.0888671875,0.9915042519569396,0.993102252483368,0.9997603297233582,0.2971398532390594,0.3001911044120788,3.4657371044158936,0.9990370273590088,4016,20000,1280000,4,263.437255859375,25.239233016967773,0.4689940214157104,0.5420897006988525,0.6766989827156067,396575,483322,14598,19859,883425,796678,2454,4264,2441,4231,"tensor([13403, 14420, 13381, 13044, 12297, 11921, 11344, 9025, 6409, 4693, 1524], device='cuda:0')","tensor([108, 113, 116, 157, 167, 176, 140, 103, 57, 24, 6], device='cuda:0')",20000,578762,4,263.437255859375,25.239233016967773,0.4391578733921051,0.562748908996582,0.7006731033325195,164211,229489,4872,7349,414551,349273,122,192,117,189,"tensor([6104, 6438, 6069, 5977, 5520, 5251, 4994, 4038, 3010, 2293, 760], device='cuda:0')","tensor([105, 110, 113, 149, 158, 169, 132, 98, 52, 19, 4], device='cuda:0')",20000,221620,4,263.437255859375,25.239233016967773,0.1280355900526046,0.4385951459407806,0.5947166681289673,15192,62477,497,799,206428,159143,12,81,12,80,"tensor([426, 432, 435, 525, 508, 516, 495, 403, 263, 182, 64], device='cuda:0')","tensor([105, 110, 112, 148, 157, 168, 131, 98, 52, 19, 4], device='cuda:0')",20000,1280000,2,263.437255859375,89.40814971923828,0.4841386675834656,0.5884713530540466,0.7224144339561462,413689,543197,15280,22932,866311,736803,2555,6507,2554,6490,"tensor([13873, 15003, 13843, 13434, 12673, 12324, 11737, 9300, 6545, 4736, 1524], device='cuda:0')","tensor([ 74, 85, 95, 112, 105, 98, 78, 51, 26, 11, 2], device='cuda:0')",20000,1922,6,263.437255859375,5.589289665222168,0.0256673507392406,0.0506842359900474,0.0958024710416793,25,50,1,1,1897,1872,0,0,0,0,"tensor([2, 2, 1, 1, 2, 2, 3, 2, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,263.437255859375,25.239233016967773,0.6345921158790588,0.8270142674446106,0.7492985129356384,311461,475202,11911,15759,346777,183036,0,0,0,0,"tensor([18072, 17672, 15346, 14165, 12990, 12007, 10458, 7063, 4040, 2328, 678], device='cuda:0')","tensor([52, 38, 20, 23, 24, 34, 23, 15, 10, 2, 2], device='cuda:0')",20000,392,3,263.437255859375,47.63780975341797,0.1244019120931625,0.2176871001720428,0.2527716159820556,26,48,0,1,366,344,0,0,0,0,"tensor([2, 2, 2, 4, 2, 2, 1, 1, 2, 0, 0], device='cuda:0')","tensor([2, 2, 2, 4, 2, 2, 1, 1, 2, 0, 0], device='cuda:0')",20000,434590,5,263.437255859375,12.710633277893066,0.4051788747310638,0.4489212930202484,0.585582971572876,111409,127330,3926,5351,323181,307260,0,0,0,0,"tensor([3951, 4105, 3935, 3985, 3743, 3600, 3414, 2711, 1890, 1432, 456], device='cuda:0')","tensor([13, 13, 14, 16, 14, 15, 16, 9, 6, 1, 0], device='cuda:0')",20000,7,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,3,263.437255859375,47.63780975341797,0.6480871438980103,0.7768723368644714,0.84548419713974,5116,7007,130,490,5426,3535,0,0,0,0,"tensor([219, 232, 218, 211, 188, 166, 161, 126, 98, 76, 24], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,3,263.437255859375,47.63780975341797,0.6529662609100342,0.7445652484893799,0.8061089515686035,5052,6302,124,328,5246,3996,0,0,0,0,"tensor([217, 229, 212, 208, 187, 165, 157, 123, 98, 76, 24], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,3,263.437255859375,47.63780975341797,0.6569905281066895,0.7837504148483276,0.8282517790794373,5115,6984,131,513,5210,3341,0,0,0,0,"tensor([219, 232, 216, 211, 188, 166, 160, 126, 98, 76, 24], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,263.437255859375,25.239233016967773,0.4199257791042328,0.4742434620857239,0.6063764095306396,119193,139857,4732,6193,324568,303904,0,0,0,0,"tensor([4014, 4294, 4067, 4104, 3872, 3768, 3585, 2852, 1953, 1448, 456], device='cuda:0')","tensor([11, 11, 13, 15, 14, 16, 16, 9, 6, 1, 0], device='cuda:0')",20000,0,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,263.437255859375,12.710633277893066,0.1224548444151878,0.1274888962507248,0.2074518799781799,427,445,20,9,6100,6082,0,0,0,0,"tensor([17, 17, 14, 19, 19, 22, 22, 17, 16, 15, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,2,263.437255859375,89.40814971923828,0.6076011061668396,0.7249881029129028,0.7962214350700378,6275,8337,169,451,7936,5874,0,0,0,0,"tensor([280, 299, 267, 250, 233, 216, 207, 165, 119, 80, 24], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,6,263.437255859375,5.589289665222168,0.0,0.2448979616165161,0.3282937407493591,0,54,0,2,385,331,0,0,0,0,"tensor([0, 0, 1, 0, 1, 2, 2, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 1, 0, 1, 2, 2, 1, 0, 0, 0], device='cuda:0')",20000,18325,3,263.437255859375,47.63780975341797,0.872809648513794,0.957627296447754,0.956369698047638,14644,18227,587,1515,3681,98,0,0,0,0,"tensor([416, 475, 406, 392, 370, 371, 353, 261, 153, 89, 24], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,263.437255859375,263.437255859375,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,7,263.437255859375,2.0472211837768555,0.0,0.0325588770210742,0.0525246225297451,0,103,0,6,6218,6115,0,0,0,0,"tensor([0, 0, 1, 3, 6, 6, 6, 7, 5, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 30,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_30/,autoencoders/matryoshka_chess/trainer_30/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,233.1999969482422,126.39087677001952,0.8859893679618835,0.0843505859375,0.9923992156982422,0.9939594268798828,0.9981743693351746,0.2971398532390594,0.299051284790039,3.4657371044158936,0.9993967413902284,3373,20000,1280000,4,290.06231689453125,25.76593399047852,0.4175426065921783,0.5181191563606262,0.647264838218689,340506,454326,10494,19425,939494,825674,1290,3090,1286,3047,"tensor([10737, 11418, 10164, 9807, 9919, 9927, 9064, 7264, 5787, 4146, 1208], device='cuda:0')","tensor([ 68, 71, 73, 90, 107, 111, 95, 72, 36, 15, 4], device='cuda:0')",20000,578762,4,290.06231689453125,25.76593399047852,0.3929964601993561,0.5250239968299866,0.6608385443687439,142372,208523,3412,7052,436390,370239,64,184,61,182,"tensor([5020, 5197, 4693, 4509, 4490, 4423, 3976, 3261, 2728, 2042, 604], device='cuda:0')","tensor([ 67, 70, 71, 87, 101, 104, 91, 68, 32, 12, 3], device='cuda:0')",20000,221620,4,290.06231689453125,25.76593399047852,0.0902032479643821,0.3993740677833557,0.500446081161499,10485,55508,370,847,211135,166112,10,110,10,110,"tensor([337, 336, 342, 372, 418, 417, 360, 285, 220, 161, 48], device='cuda:0')","tensor([ 67, 70, 70, 87, 101, 104, 90, 68, 32, 12, 3], device='cuda:0')",20000,1280000,4,290.06231689453125,25.76593399047852,0.4303209185600281,0.5538417100906372,0.6923090815544128,353891,498537,10886,21750,926109,781463,1397,4676,1396,4672,"tensor([11021, 11764, 10454, 10072, 10218, 10253, 9358, 7490, 5882, 4170, 1208], device='cuda:0')","tensor([38, 45, 55, 62, 68, 68, 55, 41, 18, 9, 1], device='cuda:0')",20000,1922,4,290.06231689453125,25.76593399047852,0.0144628109410405,0.0367159657180309,0.0387162454426288,14,36,0,3,1908,1886,0,0,0,0,"tensor([1, 1, 1, 1, 2, 1, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,290.06231689453125,25.76593399047852,0.6429437398910522,0.8040186166763306,0.7697345614433289,316879,452650,10596,15081,341359,205588,0,0,0,0,"tensor([14887, 14505, 12365, 11349, 10873, 10113, 8436, 5673, 3404, 2000, 536], device='cuda:0')","tensor([10, 10, 10, 13, 18, 20, 18, 13, 6, 2, 0], device='cuda:0')",20000,392,6,290.06231689453125,5.196249485015869,0.1682243049144745,0.4333996176719665,0.6017698645591736,36,109,0,2,356,283,0,0,0,0,"tensor([1, 1, 1, 1, 3, 2, 5, 3, 0, 0, 0], device='cuda:0')","tensor([1, 1, 1, 1, 3, 2, 5, 3, 0, 0, 0], device='cuda:0')",20000,434590,5,290.06231689453125,12.289632797241213,0.3614704310894012,0.4223144948482513,0.5540156960487366,96477,117592,2736,4711,338113,316998,0,0,0,0,"tensor([3245, 3325, 3091, 3057, 3085, 2990, 2696, 2169, 1709, 1225, 364], device='cuda:0')","tensor([ 1, 1, 2, 4, 8, 11, 10, 5, 1, 0, 0], device='cuda:0')",20000,7,0,290.06231689453125,290.06231689453125,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,290.06231689453125,290.06231689453125,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,290.06231689453125,12.289632797241213,0.5983898639678955,0.7363195419311523,0.8022657632827759,4534,6378,78,404,6008,4164,0,0,0,0,"tensor([180, 188, 169, 154, 150, 146, 127, 103, 91, 68, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,290.06231689453125,12.289632797241213,0.6069751381874084,0.7361927032470703,0.7823695540428162,4525,6205,87,354,5773,4093,0,0,0,0,"tensor([180, 186, 167, 153, 149, 143, 125, 103, 90, 67, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,290.06231689453125,12.289632797241213,0.6070830821990967,0.744373619556427,0.7881853580474854,4534,6367,78,415,5791,3958,0,0,0,0,"tensor([180, 188, 167, 154, 150, 146, 127, 103, 91, 67, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,290.06231689453125,5.196249485015869,0.0,0.5333333611488342,0.5333333611488342,0,20,0,2,53,33,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0], device='cuda:0')",20000,443761,4,290.06231689453125,25.76593399047852,0.3802753090858459,0.4627972245216369,0.577058732509613,105002,135551,3479,6478,338759,308210,0,0,0,0,"tensor([3294, 3470, 3183, 3157, 3196, 3155, 2829, 2250, 1746, 1225, 364], device='cuda:0')","tensor([ 1, 1, 2, 4, 9, 11, 10, 5, 1, 0, 0], device='cuda:0')",20000,0,0,290.06231689453125,290.06231689453125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,4,290.06231689453125,25.76593399047852,0.0722607299685478,0.1041787564754486,0.1479072421789169,245,359,9,6,6282,6168,0,0,0,0,"tensor([ 9, 8, 9, 14, 18, 18, 17, 17, 15, 12, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,290.06231689453125,25.76593399047852,0.5349802374839783,0.7137422561645508,0.7956432700157166,5219,8162,81,498,8992,6049,0,0,0,0,"tensor([212, 223, 198, 183, 183, 173, 158, 129, 94, 68, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,290.06231689453125,290.06231689453125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,290.06231689453125,96.67359161376952,0.0,0.1698113232851028,0.1698113232851028,0,36,0,3,385,349,0,0,0,0,"tensor([0, 0, 2, 1, 1, 1, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 2, 1, 1, 1, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,290.06231689453125,50.41328430175781,0.8481942415237427,0.9568491578102112,0.9564196467399596,13974,18172,651,1486,4351,153,0,0,0,0,"tensor([309, 364, 310, 300, 303, 313, 289, 213, 126, 74, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,290.06231689453125,290.06231689453125,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,4,290.06231689453125,25.76593399047852,0.0146777285262942,0.0461683422327041,0.0709307715296745,46,147,4,3,6172,6071,0,0,0,0,"tensor([2, 2, 6, 6, 7, 7, 6, 2, 2, 2, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 31,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_31/,autoencoders/matryoshka_chess/trainer_31/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,249.3999938964844,139.32669067382812,0.8189090490341187,0.0819091796875,0.9935321807861328,0.9950880408287048,1.000283122062683,0.2971398532390594,0.2986337542533874,3.4657371044158936,0.9995285272598268,2898,20000,1280000,4,316.550537109375,25.241352081298828,0.3893514275550842,0.4737603664398193,0.6103182435035706,311406,403162,8208,18804,968594,876838,666,2423,665,2410,"tensor([10007, 10818, 10143, 8747, 8168, 8111, 7682, 6482, 5138, 3690, 1152], device='cuda:0')","tensor([65, 67, 71, 61, 73, 74, 64, 56, 32, 13, 3], device='cuda:0')",20000,578762,5,316.550537109375,11.549641609191896,0.3584293127059936,0.4687401354312897,0.6040595769882202,126851,179272,2203,6876,451911,399490,15,82,15,80,"tensor([4683, 4908, 4700, 4048, 3749, 3601, 3381, 2954, 2441, 1811, 574], device='cuda:0')","tensor([61, 62, 67, 57, 69, 69, 59, 54, 29, 10, 2], device='cuda:0')",20000,221620,4,316.550537109375,25.241352081298828,0.0770763680338859,0.2193119823932647,0.3254334032535553,8896,27372,320,625,212724,194248,7,66,7,66,"tensor([327, 327, 326, 307, 323, 326, 291, 246, 185, 154, 53], device='cuda:0')","tensor([61, 62, 67, 57, 69, 69, 59, 53, 29, 10, 2], device='cuda:0')",20000,1280000,4,316.550537109375,25.241352081298828,0.400060623884201,0.5062546730041504,0.6493450999259949,322176,440681,8460,20265,957824,839319,694,3043,694,3041,"tensor([10240, 11135, 10418, 8970, 8351, 8325, 7935, 6644, 5220, 3719, 1152], device='cuda:0')","tensor([33, 38, 46, 43, 46, 45, 34, 27, 16, 6, 1], device='cuda:0')",20000,1922,2,316.550537109375,103.15771484375,0.0436991900205612,0.0614300109446048,0.0614300109446048,43,61,3,3,1879,1861,0,0,0,0,"tensor([1, 1, 2, 1, 1, 1, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,316.550537109375,25.241352081298828,0.6219000816345215,0.7582143545150757,0.7298388481140137,301013,410669,8792,14346,357225,247569,0,0,0,0,"tensor([13816, 13579, 11659, 10105, 9202, 8562, 7132, 4717, 2940, 1805, 513], device='cuda:0')","tensor([ 8, 8, 10, 6, 9, 9, 5, 5, 3, 2, 2], device='cuda:0')",20000,392,4,316.550537109375,25.241352081298828,0.0689655244350433,0.2731277346611023,0.4392156898975372,14,62,0,0,378,330,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0], device='cuda:0')",20000,434590,1,316.550537109375,199.07192993164065,0.3311687111854553,0.3890813589096069,0.5000368356704712,86645,106227,2033,5223,347945,328363,0,0,0,0,"tensor([3083, 3164, 3044, 2675, 2505, 2391, 2239, 1871, 1509, 1117, 348], device='cuda:0')","tensor([ 9, 10, 9, 7, 7, 6, 7, 2, 2, 1, 0], device='cuda:0')",20000,7,0,316.550537109375,316.550537109375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,316.550537109375,316.550537109375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,1,316.550537109375,199.07192993164065,0.5498253107070923,0.6832795143127441,0.7916838526725769,4014,5717,45,475,6528,4825,0,0,0,0,"tensor([161, 171, 166, 141, 122, 113, 108, 90, 80, 59, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,1,316.550537109375,199.07192993164065,0.5529115200042725,0.6876292824745178,0.7796045541763306,3950,5653,40,491,6348,4645,0,0,0,0,"tensor([160, 170, 165, 139, 120, 112, 107, 89, 79, 56, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,316.550537109375,25.241352081298828,0.5581201314926147,0.6917044520378113,0.7930294275283813,4014,5645,45,352,6311,4680,0,0,0,0,"tensor([161, 169, 166, 141, 122, 113, 107, 90, 78, 59, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,6,316.550537109375,4.735617637634277,0.0,0.5882353186607361,0.5882353186607361,0,25,0,7,53,28,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0], device='cuda:0')",20000,443761,1,316.550537109375,199.07192993164065,0.3457262516021728,0.4141066074371338,0.5274448394775391,93297,117569,2658,6490,350464,326192,0,0,0,0,"tensor([3117, 3338, 3149, 2763, 2588, 2517, 2370, 1936, 1546, 1118, 348], device='cuda:0')","tensor([ 9, 10, 9, 7, 7, 6, 7, 2, 2, 1, 0], device='cuda:0')",20000,0,0,316.550537109375,316.550537109375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,1,316.550537109375,199.07192993164065,0.1089752838015556,0.1122493147850036,0.1641686409711837,377,389,15,15,6150,6138,0,0,0,0,"tensor([13, 14, 13, 16, 16, 14, 14, 12, 11, 9, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,316.550537109375,25.241352081298828,0.4893965721130371,0.7007895112037659,0.7878271341323853,4627,7900,71,435,9584,6311,0,0,0,0,"tensor([190, 205, 192, 163, 147, 142, 132, 116, 91, 62, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,316.550537109375,316.550537109375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,316.550537109375,103.15771484375,0.1578947305679321,0.1710213869810104,0.1753554493188858,33,36,0,0,352,349,0,0,0,0,"tensor([2, 2, 3, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([2, 2, 3, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,316.550537109375,51.853397369384766,0.7839460372924805,0.9527359008789062,0.9563674926757812,12081,18021,415,1484,6244,304,0,0,0,0,"tensor([265, 320, 280, 244, 234, 255, 249, 175, 116, 66, 18], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,316.550537109375,316.550537109375,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,2,316.550537109375,103.15771484375,0.0153183341026306,0.0225791074335575,0.0427807494997978,48,71,1,0,6170,6147,0,0,0,0,"tensor([2, 2, 4, 4, 4, 4, 3, 3, 2, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 32,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_32/,autoencoders/matryoshka_chess/trainer_32/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,270.0400085449219,158.26084899902344,0.7615604996681213,0.0760498046875,0.9944090247154236,0.995802879333496,0.9989373683929444,0.2971398532390594,0.2984819710254669,3.4657371044158936,0.999576449394226,2536,20000,1280000,4,342.6788330078125,24.998035430908203,0.3523064851760864,0.4555271863937378,0.5847591161727905,274974,383125,6019,18992,1005026,896875,542,1302,541,1291,"tensor([8574, 9354, 8594, 7958, 7553, 7200, 6860, 5790, 4623, 3736, 1280], device='cuda:0')","tensor([60, 60, 58, 61, 54, 58, 52, 39, 26, 10, 3], device='cuda:0')",20000,578762,5,342.6788330078125,10.46511459350586,0.3302759230136871,0.4324317872524261,0.5601240396499634,114776,161427,1493,6412,463986,417335,16,31,16,31,"tensor([4072, 4360, 3964, 3693, 3489, 3227, 3118, 2693, 2231, 1846, 640], device='cuda:0')","tensor([56, 56, 55, 57, 50, 55, 49, 36, 23, 7, 1], device='cuda:0')",20000,221620,5,342.6788330078125,10.46511459350586,0.0624391250312328,0.0997194275259971,0.1802085638046264,7147,11640,160,195,214473,209980,4,3,4,3,"tensor([299, 295, 278, 284, 264, 268, 248, 208, 172, 143, 58], device='cuda:0')","tensor([56, 56, 55, 57, 50, 55, 49, 36, 23, 7, 1], device='cuda:0')",20000,1280000,4,342.6788330078125,24.998035430908203,0.3603330552577972,0.4810371100902557,0.6204939484596252,282682,411990,6322,20934,997318,868010,617,2105,617,2103,"tensor([8737, 9577, 8806, 8139, 7722, 7373, 7020, 5894, 4672, 3747, 1280], device='cuda:0')","tensor([38, 40, 43, 47, 36, 38, 32, 22, 13, 5, 2], device='cuda:0')",20000,1922,3,342.6788330078125,54.79911422729492,0.0154878674075007,0.0417515262961387,0.0417515262961387,15,41,0,1,1907,1881,0,0,0,0,"tensor([1, 1, 1, 2, 2, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,342.6788330078125,54.79911422729492,0.5571878552436829,0.7464274168014526,0.6860713362693787,256758,400471,6625,14325,401480,257767,0,0,0,0,"tensor([12170, 11918, 10114, 8933, 8059, 7305, 5734, 3851, 2494, 1686, 558], device='cuda:0')","tensor([11, 11, 15, 10, 6, 5, 3, 4, 2, 2, 0], device='cuda:0')",20000,392,0,342.6788330078125,342.6788330078125,0.197247713804245,0.197247713804245,0.2337078601121902,43,43,1,1,349,349,0,0,0,0,"tensor([2, 2, 2, 1, 1, 0, 1, 0, 0, 0, 0], device='cuda:0')","tensor([2, 2, 2, 1, 1, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,434590,3,342.6788330078125,54.79911422729492,0.2917620539665222,0.3756771981716156,0.4958001971244812,74425,101656,1161,4942,360165,332934,0,0,0,0,"tensor([2688, 2783, 2581, 2436, 2278, 2139, 2025, 1732, 1395, 1132, 382], device='cuda:0')","tensor([7, 7, 6, 7, 7, 4, 5, 5, 2, 1, 0], device='cuda:0')",20000,7,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,342.6788330078125,24.998035430908203,0.5165228247642517,0.7010016441345215,0.785036027431488,3681,5914,30,417,6861,4628,0,0,0,0,"tensor([145, 156, 137, 126, 120, 105, 103, 87, 71, 59, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,4,342.6788330078125,24.998035430908203,0.525376558303833,0.7091138958930969,0.7902987003326416,3680,5886,31,417,6618,4412,0,0,0,0,"tensor([145, 156, 136, 126, 119, 103, 102, 86, 69, 59, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,342.6788330078125,24.998035430908203,0.5245084762573242,0.7089337110519409,0.7895931005477905,3681,5904,30,427,6644,4421,0,0,0,0,"tensor([145, 156, 137, 126, 120, 105, 103, 87, 71, 59, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,342.6788330078125,24.998035430908203,0.3068590462207794,0.3913086950778961,0.5060732364654541,80734,109208,1701,5199,363027,334553,0,0,0,0,"tensor([2714, 2904, 2694, 2501, 2344, 2230, 2092, 1756, 1400, 1132, 382], device='cuda:0')","tensor([7, 7, 6, 7, 7, 4, 5, 5, 2, 1, 0], device='cuda:0')",20000,0,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,342.6788330078125,54.79911422729492,0.0571088604629039,0.0836267620325088,0.1087333783507347,192,285,5,4,6335,6242,0,0,0,0,"tensor([10, 10, 12, 13, 14, 13, 14, 14, 12, 11, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,342.6788330078125,24.998035430908203,0.451654851436615,0.7233295440673828,0.7919566035270691,4162,8455,57,712,10049,5756,0,0,0,0,"tensor([157, 170, 151, 144, 132, 119, 112, 100, 77, 61, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,2,342.6788330078125,113.69132232666016,0.1962616890668869,0.2046511620283126,0.2088166922330856,42,44,1,1,343,341,0,0,0,0,"tensor([2, 2, 3, 2, 1, 1, 1, 1, 0, 0, 0], device='cuda:0')","tensor([2, 2, 3, 2, 1, 1, 1, 1, 0, 0, 0], device='cuda:0')",20000,18325,2,342.6788330078125,113.69132232666016,0.6085711717605591,0.9558528065681458,0.9564944505691528,8080,18079,149,1424,10245,246,0,0,0,0,"tensor([212, 259, 236, 216, 204, 218, 203, 145, 89, 63, 20], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,342.6788330078125,342.6788330078125,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,342.6788330078125,342.6788330078125,0.0406235195696353,0.0406235195696353,0.0479699000716209,129,129,4,4,6089,6089,0,0,0,0,"tensor([5, 5, 4, 5, 6, 5, 4, 2, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 33,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_33/,autoencoders/matryoshka_chess/trainer_33/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,289.6399841308594,177.4999542236328,0.7348301410675049,0.0736083984375,0.994851529598236,0.996204674243927,0.9979555010795592,0.2971398532390594,0.2975706458091736,3.4657371044158936,0.9998640418052672,2062,20000,1280000,4,367.7254943847656,23.45791244506836,0.3039734661579132,0.4374254643917084,0.5521547794342041,230093,363749,3809,19387,1049907,916251,261,651,261,642,"tensor([6186, 6580, 6534, 5781, 5554, 5326, 5028, 4401, 3664, 3169, 832], device='cuda:0')","tensor([36, 37, 38, 34, 30, 24, 20, 16, 13, 9, 1], device='cuda:0')",20000,578762,4,367.7254943847656,23.45791244506836,0.2980676293373108,0.406531423330307,0.5187771320343018,101574,149581,1214,7546,477188,429181,0,0,0,0,"tensor([2952, 3026, 3025, 2664, 2558, 2371, 2206, 2052, 1772, 1568, 416], device='cuda:0')","tensor([35, 35, 37, 33, 29, 21, 18, 14, 11, 7, 1], device='cuda:0')",20000,221620,4,367.7254943847656,23.45791244506836,0.0449387691915035,0.0484082475304603,0.0875642746686935,5097,5500,125,114,216523,216120,0,0,0,0,"tensor([210, 206, 203, 192, 184, 161, 149, 138, 126, 121, 34], device='cuda:0')","tensor([35, 35, 37, 33, 29, 21, 18, 14, 11, 7, 1], device='cuda:0')",20000,1280000,4,367.7254943847656,23.45791244506836,0.3079093694686889,0.4647656083106994,0.5818729400634766,233627,394184,3878,22086,1046373,885816,261,1052,261,1043,"tensor([6280, 6737, 6676, 5906, 5688, 5450, 5171, 4491, 3696, 3186, 832], device='cuda:0')","tensor([24, 25, 25, 22, 17, 18, 20, 15, 7, 3, 0], device='cuda:0')",20000,1922,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,367.7254943847656,23.45791244506836,0.4177285432815552,0.7305551171302795,0.5931788682937622,174758,386723,3710,13749,483480,271515,0,0,0,0,"tensor([10172, 9944, 8385, 7132, 6459, 5805, 4530, 2857, 1885, 1434, 358], device='cuda:0')","tensor([34, 6, 7, 7, 4, 2, 0, 2, 0, 0, 0], device='cuda:0')",20000,392,0,367.7254943847656,367.7254943847656,0.054590567946434,0.054590567946434,0.1014492809772491,11,11,0,0,381,381,0,0,0,0,"tensor([1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')","tensor([1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,434590,4,367.7254943847656,23.45791244506836,0.2593469023704529,0.3584222793579101,0.4601797461509704,64893,95919,951,4720,369697,338671,0,0,0,0,"tensor([1961, 1992, 1986, 1793, 1691, 1555, 1440, 1282, 1090, 939, 241], device='cuda:0')","tensor([5, 6, 4, 5, 5, 2, 1, 0, 0, 0, 0], device='cuda:0')",20000,7,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,367.7254943847656,23.45791244506836,0.4849526882171631,0.6848918795585632,0.7433529496192932,3384,5687,30,378,7158,4855,0,0,0,0,"tensor([106, 108, 105, 90, 84, 80, 71, 66, 57, 49, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,4,367.7254943847656,23.45791244506836,0.4932086765766144,0.693600594997406,0.751350998878479,3377,5674,19,389,6921,4624,0,0,0,0,"tensor([105, 108, 104, 90, 83, 79, 70, 66, 56, 49, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,367.7254943847656,23.45791244506836,0.4926122426986694,0.6932275891304016,0.7503687739372253,3384,5681,30,384,6941,4644,0,0,0,0,"tensor([106, 107, 105, 90, 84, 80, 71, 66, 57, 49, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,4,367.7254943847656,23.45791244506836,0.0,0.5135135054588318,0.5135135054588318,0,19,0,2,53,34,0,0,0,0,"tensor([0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,367.7254943847656,23.45791244506836,0.2611083388328552,0.3892327547073364,0.4801759719848633,66794,108731,1064,6202,376967,335030,0,0,0,0,"tensor([1980, 2087, 2061, 1849, 1771, 1633, 1532, 1325, 1106, 939, 241], device='cuda:0')","tensor([5, 6, 4, 5, 5, 2, 1, 0, 0, 0, 0], device='cuda:0')",20000,0,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,367.7254943847656,55.22026824951172,0.0516263842582702,0.0588672496378421,0.0706160441040992,173,198,2,2,6354,6329,0,0,0,0,"tensor([6, 6, 5, 7, 7, 7, 8, 8, 8, 9, 4], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,367.7254943847656,55.22026824951172,0.4170689880847931,0.7015016674995422,0.7929491400718689,3758,7988,52,575,10453,6223,0,0,0,0,"tensor([118, 127, 129, 109, 102, 92, 84, 75, 63, 51, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,367.7254943847656,55.22026824951172,0.4397830367088318,0.9553149342536926,0.956449031829834,5189,18172,84,1547,13136,153,0,0,0,0,"tensor([143, 183, 171, 158, 157, 157, 144, 104, 74, 56, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,367.7254943847656,367.7254943847656,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,3,367.7254943847656,55.22026824951172,0.0310323014855384,0.0316555872559547,0.0400315225124359,98,100,0,0,6120,6118,0,0,0,0,"tensor([2, 2, 2, 3, 3, 3, 3, 3, 1, 1, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 34,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_34/,autoencoders/matryoshka_chess/trainer_34/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,313.1600036621094,198.34483337402344,0.6437424421310425,0.072265625,0.9960172772407532,0.997270405292511,0.998173177242279,0.2971398532390594,0.2978134453296661,3.4657371044158936,0.999787449836731,1649,20000,1280000,4,395.8947448730469,20.350048065185547,0.2448130398988723,0.4345688819885254,0.5376999974250793,178762,360499,1634,18612,1101238,919501,183,265,183,265,"tensor([4472, 4631, 5132, 4659, 4441, 4362, 4098, 3729, 2986, 2759, 1216], device='cuda:0')","tensor([18, 18, 20, 18, 17, 13, 12, 12, 5, 4, 2], device='cuda:0')",20000,578762,4,395.8947448730469,20.350048065185547,0.2536940276622772,0.4045960307121277,0.5026280283927917,84180,148580,692,7119,494582,430182,0,7,0,7,"tensor([2172, 2157, 2405, 2184, 2063, 1938, 1844, 1754, 1472, 1368, 608], device='cuda:0')","tensor([18, 18, 19, 17, 16, 12, 11, 11, 4, 3, 2], device='cuda:0')",20000,221620,2,395.8947448730469,126.0859146118164,0.0334078483283519,0.0340729691088199,0.0512980408966541,3766,3842,70,54,217854,217778,0,0,0,0,"tensor([156, 151, 157, 140, 144, 122, 111, 107, 99, 91, 40], device='cuda:0')","tensor([18, 18, 19, 17, 16, 12, 11, 11, 4, 3, 2], device='cuda:0')",20000,1280000,4,395.8947448730469,20.350048065185547,0.2471713423728943,0.4563388526439667,0.5637542009353638,180726,384384,1628,20259,1099274,895616,187,289,187,289,"tensor([4522, 4720, 5220, 4749, 4518, 4461, 4175, 3776, 2996, 2765, 1216], device='cuda:0')","tensor([12, 12, 16, 9, 5, 4, 6, 7, 1, 1, 0], device='cuda:0')",20000,1922,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,395.8947448730469,20.350048065185547,0.3187626004219055,0.7306286096572876,0.487627625465393,125402,386953,3165,14042,532836,271285,0,0,0,0,"tensor([8915, 8602, 7312, 6063, 5349, 4687, 3485, 2165, 1380, 1195, 499], device='cuda:0')","tensor([28, 0, 2, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,392,2,395.8947448730469,126.0859146118164,0.0,0.0873786434531211,0.1190476194024086,0,18,0,2,392,374,0,0,0,0,"tensor([0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')","tensor([0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0], device='cuda:0')",20000,434590,4,395.8947448730469,20.350048065185547,0.2116124927997589,0.349906712770462,0.4415454864501953,51494,93110,598,4499,383096,341480,0,0,0,0,"tensor([1390, 1370, 1510, 1354, 1294, 1222, 1151, 1064, 877, 806, 359], device='cuda:0')","tensor([4, 4, 5, 4, 1, 2, 2, 2, 1, 0, 0], device='cuda:0')",20000,7,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,395.8947448730469,7.338444709777832,0.4094915091991424,0.6176432371139526,0.7078037858009338,2718,4775,15,145,7824,5767,0,0,0,0,"tensor([75, 75, 83, 72, 66, 63, 62, 56, 47, 43, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,395.8947448730469,7.338444709777832,0.4171590805053711,0.62728351354599,0.711739182472229,2718,4773,15,147,7580,5525,0,0,0,0,"tensor([75, 74, 83, 72, 66, 63, 62, 56, 47, 43, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,395.8947448730469,7.338444709777832,0.4162964820861816,0.6264349222183228,0.7144106030464172,2718,4775,15,145,7607,5550,0,0,0,0,"tensor([75, 75, 83, 72, 66, 63, 61, 56, 47, 43, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,395.8947448730469,20.350048065185547,0.2086052447557449,0.3622669875621795,0.4607357978820801,51734,99230,504,4837,392027,344531,0,0,0,0,"tensor([1398, 1434, 1594, 1430, 1339, 1289, 1218, 1099, 884, 806, 359], device='cuda:0')","tensor([4, 4, 5, 4, 1, 2, 2, 2, 1, 0, 0], device='cuda:0')",20000,0,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,1,395.8947448730469,259.31085205078125,0.0487003289163112,0.0487076044082641,0.0619994066655635,163,163,4,3,6364,6364,0,0,0,0,"tensor([6, 6, 8, 6, 6, 6, 7, 7, 6, 6, 3], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,395.8947448730469,53.27312469482422,0.3412415981292724,0.6687576770782471,0.7687246799468994,2927,7356,17,432,11284,6855,0,0,0,0,"tensor([83, 85, 96, 85, 81, 74, 69, 58, 48, 43, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,395.8947448730469,53.27312469482422,0.2948258817195892,0.9549225568771362,0.9563446640968324,3171,18070,15,1451,15154,255,0,0,0,0,"tensor([ 92, 119, 133, 123, 117, 118, 109, 78, 55, 45, 19], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,395.8947448730469,395.8947448730469,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,395.8947448730469,395.8947448730469,0.0213138218969106,0.0213138218969106,0.0241423118859529,67,67,2,2,6151,6151,0,0,0,0,"tensor([3, 3, 3, 4, 4, 2, 1, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 35,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_35/,autoencoders/matryoshka_chess/trainer_35/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,333.2799987792969,223.8944091796875,0.5504840612411499,0.071533203125,0.9969915151596068,0.9981344938278198,0.998697817325592,0.2971398532390594,0.2968572378158569,3.4657371044158936,1.0000892877578735,1399,20000,1280000,4,421.79632568359375,18.984375,0.1968971937894821,0.4303325414657593,0.526475727558136,139810,356549,322,20537,1140190,923451,33,94,33,94,"tensor([2656, 2733, 3405, 3254, 3415, 3672, 3623, 3153, 2402, 2251, 832], device='cuda:0')","tensor([11, 11, 10, 11, 9, 10, 8, 6, 6, 5, 1], device='cuda:0')",20000,578762,4,421.79632568359375,18.984375,0.2149976342916488,0.4055466055870056,0.4911394715309143,69729,149377,158,8531,509033,429385,0,0,0,0,"tensor([1315, 1301, 1592, 1498, 1564, 1676, 1624, 1486, 1182, 1124, 416], device='cuda:0')","tensor([10, 10, 9, 9, 7, 7, 5, 3, 3, 2, 0], device='cuda:0')",20000,221620,7,421.79632568359375,0.8992458581924438,0.0226245746016502,0.0273477658629417,0.0367089472711086,2536,3073,25,42,219084,218547,0,0,0,0,"tensor([90, 89, 98, 90, 85, 84, 86, 92, 72, 73, 32], device='cuda:0')","tensor([10, 10, 9, 9, 7, 7, 5, 3, 3, 2, 0], device='cuda:0')",20000,1280000,4,421.79632568359375,18.984375,0.1971134394407272,0.4515319764614105,0.5514333248138428,139980,379800,319,22473,1140020,900200,33,119,33,119,"tensor([2669, 2760, 3467, 3336, 3493, 3726, 3687, 3194, 2408, 2252, 832], device='cuda:0')","tensor([4, 4, 6, 6, 3, 4, 3, 3, 4, 3, 1], device='cuda:0')",20000,1922,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,421.79632568359375,56.46512985229492,0.1833534985780716,0.7241047620773315,0.4175157248973846,66541,381664,1043,14266,591697,276574,0,0,0,0,"tensor([7921, 7613, 6657, 5506, 4662, 4175, 3269, 1922, 1060, 936, 356], device='cuda:0')","tensor([29, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,7,421.79632568359375,0.8992458581924438,0.0,0.044665016233921,0.044665016233921,0,9,0,2,392,383,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,434590,4,421.79632568359375,18.984375,0.1646612286567688,0.3405155539512634,0.4250352680683136,39001,90262,121,5297,395589,344328,0,0,0,0,"tensor([804, 810, 986, 907, 956, 992, 953, 876, 690, 649, 247], device='cuda:0')","tensor([1, 1, 1, 2, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,421.79632568359375,6.190450191497803,0.35211381316185,0.6276247501373291,0.696845293045044,2253,4887,2,144,8289,5655,0,0,0,0,"tensor([45, 45, 54, 47, 51, 57, 54, 48, 37, 35, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,421.79632568359375,6.190450191497803,0.3589580357074737,0.6365712285041809,0.7041046023368835,2253,4879,2,152,8045,5419,0,0,0,0,"tensor([45, 45, 53, 47, 51, 57, 54, 48, 37, 35, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,421.79632568359375,6.190450191497803,0.3581876158714294,0.6363636255264282,0.7039324641227722,2253,4886,2,145,8072,5439,0,0,0,0,"tensor([45, 45, 54, 47, 51, 57, 53, 47, 37, 35, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,421.79632568359375,18.984375,0.1616211682558059,0.3491498827934265,0.4393144249916076,39024,94915,122,5016,404737,348846,0,0,0,0,"tensor([ 808, 832, 1041, 968, 983, 1046, 1009, 902, 690, 649, 247], device='cuda:0')","tensor([1, 1, 1, 2, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,3,421.79632568359375,56.46512985229492,0.0277987606823444,0.0334387682378292,0.0340310186147689,92,111,0,1,6435,6416,0,0,0,0,"tensor([3, 3, 3, 4, 3, 3, 3, 3, 3, 3, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,421.79632568359375,56.46512985229492,0.2763932049274444,0.6592168807983398,0.754642903804779,2279,7197,1,427,11932,7014,0,0,0,0,"tensor([47, 47, 63, 60, 58, 65, 55, 52, 38, 35, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,421.79632568359375,145.0930633544922,0.2265337705612182,0.9444994330406188,0.9568602442741394,2341,17656,2,1406,15984,669,0,0,0,0,"tensor([ 50, 65, 97, 94, 93, 101, 93, 71, 40, 36, 13], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,421.79632568359375,421.79632568359375,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,2,421.79632568359375,145.0930633544922,0.007046764716506,0.0083226636052131,0.0115052731707692,22,26,4,4,6196,6192,0,0,0,0,"tensor([1, 1, 2, 1, 1, 0, 0, 1, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 36,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_36/,autoencoders/matryoshka_chess/trainer_36/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,353.8399963378906,256.3359680175781,0.4507381021976471,0.0736083984375,0.9978792667388916,0.9988410472869872,1.0004087686538696,0.2971398532390594,0.2970967888832092,3.4657371044158936,1.0000135898590088,1227,20000,1280000,4,445.9081726074219,20.618749618530277,0.1743373870849609,0.4226761758327484,0.5187910795211792,122265,348525,360,20610,1157735,931475,87,50,87,50,"tensor([1469, 1416, 1981, 2209, 2537, 2678, 2467, 2249, 1876, 1684, 636], device='cuda:0')","tensor([3, 3, 4, 4, 4, 4, 3, 4, 3, 3, 0], device='cuda:0')",20000,578762,4,445.9081726074219,20.618749618530277,0.1849286258220672,0.3927224576473236,0.479039192199707,58973,143489,57,8489,519789,435273,0,0,0,0,"tensor([ 726, 673, 898, 955, 1134, 1173, 1056, 1054, 932, 838, 318], device='cuda:0')","tensor([3, 3, 3, 3, 3, 3, 2, 3, 2, 2, 0], device='cuda:0')",20000,221620,7,445.9081726074219,0.8593960404396057,0.0143444649875164,0.0218189619481563,0.0261664260178804,1601,2445,1,52,220019,219175,0,0,0,0,"tensor([37, 36, 43, 42, 38, 40, 39, 41, 40, 39, 17], device='cuda:0')","tensor([3, 3, 3, 3, 3, 3, 2, 3, 2, 2, 0], device='cuda:0')",20000,1280000,4,445.9081726074219,20.618749618530277,0.1751918047666549,0.4402059316635132,0.5423461198806763,122925,367415,394,21872,1157075,912585,87,56,87,56,"tensor([1477, 1432, 2025, 2272, 2610, 2746, 2518, 2266, 1882, 1686, 636], device='cuda:0')","tensor([1, 1, 3, 3, 2, 2, 1, 1, 1, 1, 0], device='cuda:0')",20000,1922,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,3,445.9081726074219,64.04151916503906,0.1762830466032028,0.7152504920959473,0.4021406471729278,63754,374204,1322,13916,594484,284034,0,0,0,0,"tensor([7439, 7020, 6140, 5108, 4114, 3565, 2651, 1345, 805, 685, 253], device='cuda:0')","tensor([72, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,4,445.9081726074219,20.618749618530277,0.1385900825262069,0.3317558765411377,0.4071507751941681,32363,87490,79,5356,402227,347100,0,0,0,0,"tensor([433, 401, 533, 576, 642, 691, 611, 569, 530, 481, 181], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,445.9081726074219,6.169049263000488,0.3012970387935638,0.6318951845169067,0.7026146650314331,1870,4943,1,160,8672,5599,0,0,0,0,"tensor([24, 22, 28, 29, 35, 38, 34, 36, 30, 26, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,445.9081726074219,6.169049263000488,0.3073383271694183,0.6419063210487366,0.709787905216217,1870,4943,1,160,8428,5355,0,0,0,0,"tensor([24, 22, 28, 29, 35, 38, 34, 36, 30, 26, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,445.9081726074219,6.169049263000488,0.3066579103469848,0.6400051712989807,0.7094833254814148,1870,4937,1,166,8455,5388,0,0,0,0,"tensor([24, 22, 28, 29, 35, 38, 34, 36, 30, 26, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,445.9081726074219,20.618749618530277,0.1409120261669159,0.3573375344276428,0.4381223917007446,33645,97804,126,5839,410116,345957,0,0,0,0,"tensor([434, 418, 583, 634, 701, 742, 656, 605, 531, 481, 181], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,0,445.9081726074219,445.9081726074219,0.0221212115138769,0.0221212115138769,0.0221212115138769,73,73,0,0,6454,6454,0,0,0,0,"tensor([2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,445.9081726074219,20.618749618530277,0.2326824963092804,0.7140293121337891,0.7895364761352539,1871,8357,0,840,12340,5854,0,0,0,0,"tensor([24, 22, 35, 39, 48, 46, 37, 35, 30, 27, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,2,445.9081726074219,168.39515686035156,0.2118920981884002,0.945379376411438,0.956412672996521,2172,17611,4,1321,16153,714,0,0,0,0,"tensor([26, 39, 63, 79, 70, 80, 68, 49, 33, 28, 10], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,445.9081726074219,445.9081726074219,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 37,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_37/,autoencoders/matryoshka_chess/trainer_37/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,374.2799987792969,287.1025695800781,0.3569938540458679,0.07421875,0.9985251426696776,0.99932461977005,0.9992156624794006,0.2971398532390594,0.2974281311035156,3.4657371044158936,0.9999090433120728,1094,20000,1280000,4,465.9142761230469,26.07852935791016,0.1431032419204712,0.4205040335655212,0.5117353200912476,98647,346025,36,19738,1181353,933975,0,57,0,56,"tensor([1053, 922, 1540, 1440, 1766, 1964, 1979, 1620, 1371, 1183, 576], device='cuda:0')","tensor([1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1], device='cuda:0')",20000,578762,4,465.9142761230469,26.07852935791016,0.1570117771625518,0.3744412958621979,0.4718625545501709,49309,134926,22,6991,529453,443836,0,0,0,0,"tensor([526, 447, 690, 608, 763, 853, 832, 747, 673, 589, 288], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,221620,7,465.9142761230469,0.8181477785110474,0.0107976626604795,0.0152578791603446,0.0208373311907053,1203,1704,3,36,220417,219916,0,0,0,0,"tensor([32, 31, 38, 26, 26, 25, 23, 26, 26, 27, 16], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,1280000,4,465.9142761230469,26.07852935791016,0.1431116312742233,0.4460888206958771,0.5380429029464722,98653,373671,33,21650,1181347,906329,0,97,0,97,"tensor([1056, 927, 1584, 1484, 1846, 2027, 2034, 1648, 1376, 1188, 576], device='cuda:0')","tensor([1, 1, 2, 1, 1, 1, 2, 1, 1, 1, 1], device='cuda:0')",20000,1922,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,465.9142761230469,26.07852935791016,0.0973712652921676,0.7150977253913879,0.4054069519042969,33687,373606,4,13065,624551,284632,0,0,0,0,"tensor([7275, 6789, 6070, 4877, 3955, 3267, 2623, 1173, 603, 487, 230], device='cuda:0')","tensor([31, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], device='cuda:0')",20000,392,7,465.9142761230469,0.8181477785110474,0.0,0.1055155843496322,0.1448598057031631,0,22,0,3,392,370,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 2, 1, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 2, 1, 0, 0], device='cuda:0')",20000,434590,4,465.9142761230469,26.07852935791016,0.1135931089520454,0.3150636851787567,0.4081656634807586,26171,82136,24,4667,408419,352454,0,0,0,0,"tensor([306, 272, 388, 377, 448, 501, 465, 409, 382, 334, 167], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,7,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,5,465.9142761230469,7.295449256896973,0.2559351325035095,0.6408037543296814,0.7091699242591858,1547,5071,0,214,8995,5471,0,0,0,0,"tensor([17, 14, 23, 17, 26, 26, 29, 26, 22, 18, 9], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,5,465.9142761230469,7.295449256896973,0.26120725274086,0.6503241062164307,0.7153589129447937,1547,5067,0,218,8751,5231,0,0,0,0,"tensor([17, 14, 22, 17, 25, 26, 29, 26, 22, 18, 9], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,5,465.9142761230469,7.295449256896973,0.260613203048706,0.6485586166381836,0.7155187726020813,1547,5062,0,223,8778,5263,0,0,0,0,"tensor([17, 14, 23, 17, 25, 26, 29, 26, 22, 18, 9], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,465.9142761230469,26.07852935791016,0.1114231944084167,0.3500731289386749,0.4371112883090973,26182,95386,13,5802,417579,348375,0,0,0,0,"tensor([306, 277, 447, 408, 509, 536, 518, 436, 383, 334, 167], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,2,465.9142761230469,207.0000762939453,0.0064141722396016,0.0221212115138769,0.0221212115138769,21,73,0,0,6506,6454,0,0,0,0,"tensor([1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,3,465.9142761230469,82.9131088256836,0.1963447332382202,0.6826342344284058,0.766923189163208,1547,7681,0,612,12664,6530,0,0,0,0,"tensor([17, 15, 26, 26, 39, 35, 33, 26, 22, 19, 9], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,4,465.9142761230469,26.07852935791016,0.1556964516639709,0.9341382384300232,0.9565263390541076,1547,17176,0,1273,16778,1149,0,0,0,0,"tensor([17, 22, 55, 63, 71, 71, 68, 40, 27, 20, 9], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,465.9142761230469,465.9142761230469,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 38,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_38/,autoencoders/matryoshka_chess/trainer_38/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,395.0799865722656,326.6731262207031,0.2592175900936126,0.077392578125,0.9990832805633544,0.9996671676635742,0.9998090863227844,0.2971398532390594,0.2971459031105041,3.4657371044158936,0.9999980926513672,1041,20000,1280000,4,483.04931640625,39.02927780151367,0.1350976228713989,0.4243505299091339,0.5133635401725769,92741,350832,207,22669,1187259,929168,84,41,84,41,"tensor([ 624, 537, 1039, 1211, 1641, 1823, 1922, 1630, 1231, 969, 384], device='cuda:0')","tensor([0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,578762,4,483.04931640625,39.02927780151367,0.1483152061700821,0.3971934616565704,0.4764930009841919,46366,145941,108,10158,532396,432821,0,0,0,0,"tensor([312, 257, 450, 485, 697, 794, 820, 702, 599, 482, 192], device='cuda:0')","tensor([0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,221620,7,483.04931640625,0.8837491273880005,0.0083934683352708,0.0155503051355481,0.0238860230892896,934,1737,0,47,220686,219883,0,0,0,0,"tensor([14, 14, 20, 17, 19, 17, 15, 18, 17, 19, 10], device='cuda:0')","tensor([0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1280000,4,483.04931640625,39.02927780151367,0.1351063549518585,0.446768194437027,0.5370003581047058,92747,375099,201,24067,1187253,904901,84,47,84,47,"tensor([ 624, 537, 1067, 1249, 1716, 1896, 1982, 1662, 1240, 970, 384], device='cuda:0')","tensor([0, 0, 0, 1, 0, 0, 2, 0, 0, 0, 0], device='cuda:0')",20000,1922,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,483.04931640625,39.02927780151367,0.3662288784980774,0.7129132747650146,0.4620407819747925,148636,371775,4837,12961,509602,286463,0,0,0,0,"tensor([7224, 6918, 6143, 5047, 4001, 3273, 2736, 1472, 533, 392, 156], device='cuda:0')","tensor([44, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,4,483.04931640625,39.02927780151367,0.1049549952149391,0.3132175505161285,0.4044142961502075,24074,81570,85,4692,410516,353020,0,0,0,0,"tensor([170, 146, 261, 280, 366, 456, 461, 389, 334, 266, 106], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,7,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,483.04931640625,39.02927780151367,0.2432522624731063,0.7043740749359131,0.7263383865356445,1460,6071,2,625,9082,4471,0,0,0,0,"tensor([10, 8, 13, 14, 25, 25, 29, 23, 20, 15, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,4,483.04931640625,39.02927780151367,0.2482993155717849,0.6912999153137207,0.719485878944397,1460,5725,2,540,8838,4573,0,0,0,0,"tensor([10, 8, 13, 14, 23, 25, 29, 23, 20, 15, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,483.04931640625,39.02927780151367,0.2477305680513382,0.6907775402069092,0.7195192575454712,1460,5730,2,535,8865,4595,0,0,0,0,"tensor([10, 8, 13, 14, 23, 25, 29, 23, 20, 15, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,483.04931640625,39.02927780151367,0.1028979420661926,0.3436027765274048,0.4248223304748535,24074,93216,85,5603,419687,350545,0,0,0,0,"tensor([170, 152, 296, 313, 437, 498, 505, 436, 336, 266, 106], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,0,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,0,483.04931640625,483.04931640625,0.0064141722396016,0.0064141722396016,0.0064141722396016,21,21,0,0,6506,6506,0,0,0,0,"tensor([1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,4,483.04931640625,39.02927780151367,0.1865628659725189,0.6417146921157837,0.7135438919067383,1462,6961,0,523,12749,7250,0,0,0,0,"tensor([10, 8, 18, 20, 31, 35, 34, 28, 20, 16, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,483.04931640625,118.7784652709961,0.1477737873792648,0.9487610459327698,0.9567378163337708,1462,17785,0,1381,16863,540,0,0,0,0,"tensor([10, 15, 47, 66, 70, 63, 59, 49, 22, 16, 6], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,483.04931640625,483.04931640625,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')" 39,autoencoders/matryoshka_chess/,autoencoders/matryoshka_chess/trainer_39/,autoencoders/matryoshka_chess/trainer_39/indexing_find_dots_indices_n_inputs_1000_reconstruction.pkl,MatryoshkaBatchTopKTrainer,MatryoshkaBatchTopKSAE,1000,1000,1000,415.8399963378906,354.6701965332031,0.200992539525032,0.082763671875,0.9993649125099182,0.999803900718689,1.0000628232955933,0.2971398532390594,0.2972148954868316,3.4657371044158936,0.9999762773513794,1052,20000,1280000,4,499.2204284667969,49.69258880615234,0.1091414839029312,0.4094038307666778,0.5170976519584656,73883,334261,11,18655,1206117,945739,0,32,0,32,"tensor([ 469, 417, 818, 880, 1346, 1718, 1546, 1365, 921, 798, 320], device='cuda:0')","tensor([0, 0, 0, 0, 3, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,578762,4,499.2204284667969,49.69258880615234,0.1198946163058281,0.370108813047409,0.476701557636261,36908,132959,4,6765,541854,445803,0,0,0,0,"tensor([232, 195, 329, 300, 504, 733, 635, 576, 454, 398, 160], device='cuda:0')","tensor([0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,221620,7,499.2204284667969,0.8328491449356079,0.00270367693156,0.0104478485882282,0.0167021509259939,300,1164,0,37,221320,220456,0,0,0,0,"tensor([ 6, 6, 9, 8, 15, 10, 7, 13, 14, 9, 6], device='cuda:0')","tensor([0, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,1280000,4,499.2204284667969,49.69258880615234,0.1091820672154426,0.4372316300868988,0.5432928204536438,73912,364050,10,21200,1206088,915950,0,40,0,40,"tensor([ 471, 419, 858, 919, 1431, 1796, 1593, 1396, 927, 798, 320], device='cuda:0')","tensor([0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,1922,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,1922,1922,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,658238,4,499.2204284667969,49.69258880615234,0.5800244808197021,0.7070753574371338,0.5995208024978638,271932,367070,7487,12969,386306,291168,0,0,0,0,"tensor([7408, 7138, 6383, 5369, 4326, 3442, 2686, 1473, 413, 302, 120], device='cuda:0')","tensor([73, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,392,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,392,392,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,434590,4,499.2204284667969,49.69258880615234,0.0835475772619247,0.3101528584957123,0.4044485986232757,18946,80605,2,4581,415644,353985,0,0,0,0,"tensor([128, 107, 187, 181, 301, 398, 352, 320, 247, 215, 89], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,7,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,7,7,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,69,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,69,69,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10542,4,499.2204284667969,49.69258880615234,0.196715697646141,0.6711376905441284,0.7319312691688538,1150,5454,0,257,9392,5088,0,0,0,0,"tensor([ 7, 6, 11, 9, 17, 26, 20, 19, 15, 13, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10298,4,499.2204284667969,49.69258880615234,0.2009084522724151,0.6723660826683044,0.7338337302207947,1150,5348,0,262,9148,4950,0,0,0,0,"tensor([ 7, 6, 11, 9, 16, 26, 20, 19, 15, 13, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,10325,4,499.2204284667969,49.69258880615234,0.2004357427358627,0.672858476638794,0.7349480390548706,1150,5361,0,249,9175,4964,0,0,0,0,"tensor([ 7, 6, 10, 9, 16, 26, 20, 19, 15, 13, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,53,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,53,53,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,443761,4,499.2204284667969,49.69258880615234,0.0818916410207748,0.3376993238925934,0.4259745478630066,18946,91206,2,5194,424815,352555,0,0,0,0,"tensor([128, 112, 228, 233, 378, 458, 385, 348, 249, 215, 89], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], device='cuda:0')",20000,0,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6527,5,499.2204284667969,12.375248908996582,0.0,0.0188192445784807,0.0188192445784807,0,62,0,0,6527,6465,0,0,0,0,"tensor([0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,14211,5,499.2204284667969,12.375248908996582,0.14972984790802,0.6980679035186768,0.7565141320228577,1150,8003,0,715,13061,6208,0,0,0,0,"tensor([ 7, 6, 17, 13, 25, 35, 30, 21, 16, 13, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,0,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,0,0,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,385,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,385,385,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,18325,3,499.2204284667969,147.39488220214844,0.119451992213726,0.9486817121505736,0.9566400051116944,1164,17793,0,1393,17161,532,0,0,0,0,"tensor([ 8, 12, 49, 58, 78, 66, 54, 43, 20, 13, 5], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,2988,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,2988,2988,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')",20000,6218,0,499.2204284667969,499.2204284667969,0.0,0.0,0.0,0,0,0,0,6218,6218,0,0,0,0,"tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')","tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], device='cuda:0')"