Spaces:
Sleeping
Sleeping
mj-new
committed on
Commit
·
3611c30
1
Parent(s):
ee8e535
removed bigos diagnostic
Browse files
app.py
CHANGED
|
@@ -95,15 +95,20 @@ with analysis_bigos:
|
|
| 95 |
st.dataframe(df_metrics_subset_size)
|
| 96 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 97 |
st.dataframe(df_metrics_subset_features)
|
| 98 |
-
|
| 99 |
-
with analysis_bigos_diagnostic:
|
| 100 |
-
dataset_name = "amu-cai/pl-asr-bigos-v2-diagnostic"
|
| 101 |
-
dataset_short_name = "BIGOS diagnostic"
|
| 102 |
-
dataset_version = "V2"
|
| 103 |
|
| 104 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 105 |
# remove "all" subset, which is always the last config type
|
| 106 |
-
dataset_configs.pop()
|
|
|
|
|
|
|
|
|
|
| 107 |
print(dataset_configs)
|
| 108 |
# read the reports for public and secret datasets
|
| 109 |
[stats_dict_public, contents_dict_public] = read_reports(dataset_name)
|
|
@@ -116,7 +121,6 @@ with analysis_bigos_diagnostic:
|
|
| 116 |
# extract metrics from dictionary and convert to various dataframes for easier analysis and visualization
|
| 117 |
#st.header("Summary statistics")
|
| 118 |
|
| 119 |
-
|
| 120 |
st.header("Dataset level metrics")
|
| 121 |
df_sum_stats_agg = extract_stats_to_agg(df_multindex_for_agg, metrics_size)
|
| 122 |
|
|
@@ -155,20 +159,15 @@ with analysis_bigos_diagnostic:
|
|
| 155 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 156 |
st.dataframe(df_metrics_subset_features)
|
| 157 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 158 |
|
| 159 |
-
|
| 160 |
-
with analysis_bigos_pelcra:
|
| 161 |
-
|
| 162 |
-
dataset_name = "pelcra/pl-asr-pelcra-for-bigos"
|
| 163 |
-
dataset_short_name = "PELCRA"
|
| 164 |
-
|
| 165 |
-
# local version with granted gated access
|
| 166 |
-
#dataset_configs = get_dataset_config_names(dataset_name,trust_remote_code=True)
|
| 167 |
# remove "all" subset, which is always the last config type
|
| 168 |
-
|
| 169 |
-
|
| 170 |
-
# remote version with hardcoded access
|
| 171 |
-
dataset_configs = ['ul-diabiz_poleval-22', 'ul-spokes_mix_emo-18', 'ul-spokes_mix_luz-18', 'ul-spokes_mix_parl-18', 'ul-spokes_biz_bio-23', 'ul-spokes_biz_int-23', 'ul-spokes_biz_luz-23', 'ul-spokes_biz_pod-23', 'ul-spokes_biz_pres-23', 'ul-spokes_biz_vc-23', 'ul-spokes_biz_vc2-23', 'ul-spokes_biz_wyw-23']
|
| 172 |
print(dataset_configs)
|
| 173 |
# read the reports for public and secret datasets
|
| 174 |
[stats_dict_public, contents_dict_public] = read_reports(dataset_name)
|
|
@@ -181,6 +180,7 @@ with analysis_bigos_pelcra:
|
|
| 181 |
# extract metrics from dictionary and convert to various dataframes for easier analysis and visualization
|
| 182 |
#st.header("Summary statistics")
|
| 183 |
|
|
|
|
| 184 |
st.header("Dataset level metrics")
|
| 185 |
df_sum_stats_agg = extract_stats_to_agg(df_multindex_for_agg, metrics_size)
|
| 186 |
|
|
@@ -218,3 +218,4 @@ with analysis_bigos_pelcra:
|
|
| 218 |
st.dataframe(df_metrics_subset_size)
|
| 219 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 220 |
st.dataframe(df_metrics_subset_features)
|
|
|
|
|
|
| 95 |
st.dataframe(df_metrics_subset_size)
|
| 96 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 97 |
st.dataframe(df_metrics_subset_features)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 98 |
|
| 99 |
+
#########################################PELCRA################################################
|
| 100 |
+
with analysis_bigos_pelcra:
|
| 101 |
+
|
| 102 |
+
dataset_name = "pelcra/pl-asr-pelcra-for-bigos"
|
| 103 |
+
dataset_short_name = "PELCRA"
|
| 104 |
+
|
| 105 |
+
# local version with granted gated access
|
| 106 |
+
#dataset_configs = get_dataset_config_names(dataset_name,trust_remote_code=True)
|
| 107 |
# remove "all" subset, which is always the last config type
|
| 108 |
+
#dataset_configs.pop()
|
| 109 |
+
|
| 110 |
+
# remote version with hardcoded access
|
| 111 |
+
dataset_configs = ['ul-diabiz_poleval-22', 'ul-spokes_mix_emo-18', 'ul-spokes_mix_luz-18', 'ul-spokes_mix_parl-18', 'ul-spokes_biz_bio-23', 'ul-spokes_biz_int-23', 'ul-spokes_biz_luz-23', 'ul-spokes_biz_pod-23', 'ul-spokes_biz_pres-23', 'ul-spokes_biz_vc-23', 'ul-spokes_biz_vc2-23', 'ul-spokes_biz_wyw-23']
|
| 112 |
print(dataset_configs)
|
| 113 |
# read the reports for public and secret datasets
|
| 114 |
[stats_dict_public, contents_dict_public] = read_reports(dataset_name)
|
|
|
|
| 121 |
# extract metrics from dictionary and convert to various dataframes for easier analysis and visualization
|
| 122 |
#st.header("Summary statistics")
|
| 123 |
|
|
|
|
| 124 |
st.header("Dataset level metrics")
|
| 125 |
df_sum_stats_agg = extract_stats_to_agg(df_multindex_for_agg, metrics_size)
|
| 126 |
|
|
|
|
| 159 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 160 |
st.dataframe(df_metrics_subset_features)
|
| 161 |
|
| 162 |
+
"""
|
| 163 |
+
with analysis_bigos_diagnostic:
|
| 164 |
+
dataset_name = "amu-cai/pl-asr-bigos-v2-diagnostic"
|
| 165 |
+
dataset_short_name = "BIGOS diagnostic"
|
| 166 |
+
dataset_version = "V2"
|
| 167 |
|
| 168 |
+
dataset_configs = get_dataset_config_names(dataset_name,trust_remote_code=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 169 |
# remove "all" subset, which is always the last config type
|
| 170 |
+
dataset_configs.pop()
|
|
|
|
|
|
|
|
|
|
| 171 |
print(dataset_configs)
|
| 172 |
# read the reports for public and secret datasets
|
| 173 |
[stats_dict_public, contents_dict_public] = read_reports(dataset_name)
|
|
|
|
| 180 |
# extract metrics from dictionary and convert to various dataframes for easier analysis and visualization
|
| 181 |
#st.header("Summary statistics")
|
| 182 |
|
| 183 |
+
|
| 184 |
st.header("Dataset level metrics")
|
| 185 |
df_sum_stats_agg = extract_stats_to_agg(df_multindex_for_agg, metrics_size)
|
| 186 |
|
|
|
|
| 218 |
st.dataframe(df_metrics_subset_size)
|
| 219 |
df_metrics_subset_features = extract_stats_for_dataset_card(df_multindex_for_agg, subset, metrics_features, add_total=False)
|
| 220 |
st.dataframe(df_metrics_subset_features)
|
| 221 |
+
"""
|