idolezal committed on
Commit
68ff3fc
·
1 Parent(s): c7b0220

Bokeh figure - added symbol for "ensemble" model type

Browse files
Files changed (1) hide show
  1. analyze_winscore.py +19 -6
analyze_winscore.py CHANGED
@@ -74,19 +74,32 @@ def create_scatter_plot_with_curve_with_variances_named(category, variance_acros
74
  def get_variance_for_model(model_name):
75
  return variance_across_categories.get(model_name, 0) # Default to 0 if model not found
76
 
 
 
 
 
77
  # Get marker sizes and variances for the filtered data
78
- filtered_variances = [get_variance_for_model(mname) for mname in np.array(model_names)[np.in1d(x, x_filtered)]]
79
  marker_sizes_filtered = [scale_variance_to_size(var) for var in filtered_variances]
80
 
81
  # Get marker sizes and variances for the outlier data
82
- outlier_variances = [get_variance_for_model(mname) for mname in np.array(model_names)[np.in1d(x, x_outliers)]]
83
  marker_sizes_outliers = [scale_variance_to_size(var) for var in outlier_variances]
84
 
85
- # Randomly assign symbols to the filtered data points
86
- filtered_symbols = ['circle' if ldb_records[mname]['Type'] == 'chat' else 'triangle' for mname in np.array(model_names)[np.in1d(x, x_filtered)]]
 
 
 
 
 
 
 
 
 
87
 
88
- # Randomly assign symbols to the outlier data points
89
- outlier_symbols = ['circle' if ldb_records[mname]['Type'] == 'chat' else 'triangle' for mname in np.array(model_names)[np.in1d(x, x_outliers)]]
90
 
91
  # Define a color palette with enough colors
92
  stride = len(Turbo256) // len(model_names)
 
74
  def get_variance_for_model(model_name):
75
  return variance_across_categories.get(model_name, 0) # Default to 0 if model not found
76
 
77
+ # Get markers
78
+ filtered_markers = np.array(model_names)[np.in1d(x, x_filtered)]
79
+ outlier_markers = np.array(model_names)[np.in1d(x, x_outliers)]
80
+
81
  # Get marker sizes and variances for the filtered data
82
+ filtered_variances = [get_variance_for_model(mname) for mname in filtered_markers]
83
  marker_sizes_filtered = [scale_variance_to_size(var) for var in filtered_variances]
84
 
85
  # Get marker sizes and variances for the outlier data
86
+ outlier_variances = [get_variance_for_model(mname) for mname in outlier_markers]
87
  marker_sizes_outliers = [scale_variance_to_size(var) for var in outlier_variances]
88
 
89
+ # Assign symbols to the model types
90
+ # https://docs.bokeh.org/en/latest/docs/examples/basic/scatters/markers.html
91
+ _model_type2symbol = {
92
+ 'chat': 'circle',
93
+ 'pretrained': 'triangle',
94
+ 'ensemble': 'star',
95
+ }
96
+ model_type2symbol = lambda model_type: _model_type2symbol.get(model_type, 'diamond')
97
+
98
+ # Assign symbols to the filtered data points
99
+ filtered_symbols = [model_type2symbol(ldb_records[mname]['Type']) for mname in filtered_markers]
100
 
101
+ # Assign symbols to the outlier data points
102
+ outlier_symbols = [model_type2symbol(ldb_records[mname]['Type']) for mname in outlier_markers]
103
 
104
  # Define a color palette with enough colors
105
  stride = len(Turbo256) // len(model_names)