Update dashboards to use quickboard v0.4.0 (#165)

rickymagner · web-flow · commit 9d76d93e47f6 · 2024-03-27T13:07:26.000-04:00
diff --git a/BenchmarkSVs/README.md b/BenchmarkSVs/README.md
@@ -70,7 +70,7 @@ The SVisualizer is a python script based on [Dash](https://plotly.com/dash/) and
 
 Follow these steps to ensure your environment is prepared.
 
-1. Make sure you have the Python package `quickboard` installed. It's recommended to pin the version to avoid any breaking changes in the future. The version `quickboard==0.3.5` should work with this current version.
+1. Make sure you have the Python package `quickboard` installed. It's recommended to pin the version to avoid any breaking changes in the future; `quickboard==0.4.0` should work with the current version of SVisualizer.
 2. Copy all the files from the [SVisualizer](SVisualizer) directory to a fresh directory on your local system. 
 3. Copy all the files from the WDL outputs into a subdirectory called `wdl_outputs`. You can also use the gathering script [provided](#optional-data-gathering-script) to make this step easier.
 
diff --git a/BenchmarkSVs/SVisualizer/SVisualizer.ipynb b/BenchmarkSVs/SVisualizer/SVisualizer.ipynb
@@ -10,7 +10,7 @@
    "outputs": [],
    "source": [
     "import quickboard.base as qbb\n",
-    "from quickboard.app import start_app, deploy_app, app"
+    "from quickboard.app import start_app"
    ]
   },
   {
@@ -231,7 +231,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "start_app(board, app_title='SVisualizer', mode='external', port=8050)"
+    "start_app(board, app_title='SVisualizer', jupyter_mode='external', port=8050)"
    ]
   },
   {
@@ -269,9 +269,9 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "quickboard_venv",
+   "display_name": "Python 3 (ipykernel)",
    "language": "python",
-   "name": "quickboard_venv"
+   "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
@@ -283,7 +283,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.9.6"
+   "version": "3.10.9"
   }
  },
  "nbformat": 4,
diff --git a/BenchmarkSVs/SVisualizer/truvari_tabs.py b/BenchmarkSVs/SVisualizer/truvari_tabs.py
@@ -167,8 +167,9 @@ def make_closest_plot(df, sort_by, asc, mode, disq_values):
     title = f'Counts of Disqualified ({disq_values}) Sites (N = {len(df)})'
     asc = asc == 'Ascending'
     disq_df = make_disqualified_df(df, dist_threshold=500, size_ratio_threshold=0.7, color='Experiment')
+    category_orders = {'Experiment': EXPERIMENT_ORDER} if EXPERIMENT_ORDER is not None else None
     fig = create_upset(disq_df, title=title, sort_by=sort_by, asc=asc, mode=mode, color='Experiment', 
-                       category_orders={'Experiment': EXPERIMENT_ORDER}, color_discrete_sequence=EXPERIMENT_COLORS, 
+                       category_orders=category_orders, color_discrete_sequence=EXPERIMENT_COLORS, 
                        color_discrete_map=EXPERIMENT_COLOR_DICT)
     return fig
 
diff --git a/BenchmarkVCFs/BenchmarkBoard/BenchmarkBoard.ipynb b/BenchmarkVCFs/BenchmarkBoard/BenchmarkBoard.ipynb
@@ -325,6 +325,28 @@
     "    return plot_df"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "6d1433dd-c829-470a-82d5-1eb21cb8b568",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "class SubsetConfig:\n",
+    "    def __init__(self, df):\n",
+    "        self.strat = df['Interval'].iloc[0] if len(df) > 0 and 'Interval' in df.columns else None\n",
+    "        self.type_ = df['Type'].iloc[0] if len(df) > 0 else None\n",
+    "        self.color = None if (len(df) > 0) and (df['Experiment'].iloc[0] == 'No_ExpGroups_Provided') else 'Experiment'\n",
+    "\n",
+    "    def make_title(self, prefix):\n",
+    "        title = prefix\n",
+    "        if self.strat is not None:\n",
+    "            title += f' over {self.strat}'\n",
+    "        if self.type_ is not None:\n",
+    "            title += f' for {self.type_}'\n",
+    "        return title"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -349,32 +371,30 @@
    "outputs": [],
    "source": [
     "def make_prec_recall_plot(df, marginal, axes_mode):\n",
-    "    strat = df['Interval'].iloc[0]\n",
-    "    type_ = df['Type'].iloc[0]\n",
-    "    color = None if df['Experiment'].iloc[0] == 'No_ExpGroups_Provided' else 'Experiment'\n",
+    "    cfg = SubsetConfig(df)\n",
+    "    \n",
     "    if not SINGLE_SAMPLE_MODE:\n",
     "        marginal = marginal.lower() if marginal != 'None' else None\n",
-    "        fig = px.scatter(df, x='Recall', y='Precision', color=color, marginal_x=marginal, marginal_y=marginal,\n",
-    "                          hover_data=['Query_Name'], title=f'Precision vs Recall Plot over {strat} for {type_}', \n",
+    "        fig = px.scatter(df, x='Recall', y='Precision', color=cfg.color, marginal_x=marginal, marginal_y=marginal,\n",
+    "                          hover_data=['Query_Name'], title=cfg.make_title(prefix=f'Precision vs Recall Plot'), \n",
     "                          category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "        if axes_mode == 'Fixed':\n",
     "            fig.update_layout(xaxis_range=[0, 1.1], yaxis_range=[0, 1.1])\n",
     "    else:\n",
     "        melted_df = df.melt(id_vars=['Experiment', 'Query_Name', 'Base_Name', 'Interval', 'Type'], value_vars=['Precision', 'Recall', 'F1_Score'])\n",
     "        melted_df = melted_df.rename(columns={'variable': 'Stat', 'value': 'Value'})\n",
-    "        fig = px.bar(melted_df, x='Stat', y='Value', title=f'Performance Stats over {strat} for {type_}', \n",
+    "        fig = px.bar(melted_df, x='Stat', y='Value', title=cfg.make_title(prefix=f'Performance Stats'), \n",
     "                     category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "        fig.update_layout(yaxis_range=[0, 1.1])\n",
     "    \n",
     "    return fig\n",
     "\n",
     "\n",
     "def make_stat_covariate_plot(df, covaraite, stat, axes_mode):\n",
-    "    strat = df['Interval'].iloc[0]\n",
-    "    type_ = df['Type'].iloc[0]\n",
-    "    color = None if df['Experiment'].iloc[0] == 'No_ExpGroups_Provided' else 'Experiment'\n",
-    "    fig = px.scatter(df, x=stat_corr, y=stat, color=color, hover_data=['Query_Name', 'TP_Base', 'TP_Query', 'FP', 'FN'],\n",
-    "                      title=f'Plot of {stat} by {covariate} over {strat} for {type_}', \n",
+    "    cfg = SubsetConfig(df)\n",
+    "    \n",
+    "    fig = px.scatter(df, x=stat_corr, y=stat, color=cfg.color, hover_data=['Query_Name', 'TP_Base', 'TP_Query', 'FP', 'FN'],\n",
+    "                      title=cfg.make_title(prefix=f'Plot of {stat} by {covariate}'), \n",
     "                      category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "    if axes_mode == 'Fixed':\n",
     "        fig.update_layout(yaxis_range=[0, 1.1])\n",
@@ -492,7 +512,8 @@
    "outputs": [],
    "source": [
     "def make_roc_plot(df, roc_mode, error_bars, axes_mode):\n",
-    "    type_ = df['Type'].iloc[0]\n",
+    "    cfg = SubsetConfig(df)\n",
+    "\n",
     "    if roc_mode in ['Precision', 'Recall']:\n",
     "        error_y = None\n",
     "        if not SINGLE_SAMPLE_MODE:\n",
@@ -503,11 +524,11 @@
     "    \n",
     "        fig = px.line(plot_df, x='Score', y=f'{roc_mode}_mean', error_y=error_y, \n",
     "                      hover_data=['Score', 'TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean'],\n",
-    "                      title=f'{roc_mode} Plot for {type_} stratified by Score', color='Experiment',\n",
+    "                      title=cfg.make_title(f'{roc_mode} Plot') + ' stratified by Score', color=cfg.color,\n",
     "                      category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "    else:\n",
-    "        fig = px.line(df, x='Recall', y='Precision', color='Experiment', line_group='Query_Name', hover_data=['Score'],\n",
-    "                      title=f'ROC Plot for {type_} stratified by Score')\n",
+    "        fig = px.line(df, x='Recall', y='Precision', color=cfg.color, line_group='Query_Name', hover_data=['Score'],\n",
+    "                      title=cfg.make_title(f'ROC Plot') + ' stratified by Score')\n",
     "        fig.update_layout(xaxis_range=[0, 1.1])\n",
     "\n",
     "    if axes_mode == 'Fixed':\n",
@@ -605,9 +626,7 @@
    "outputs": [],
    "source": [
     "def make_titv_plot(df, stat, axes_mode):\n",
-    "    color = None if df['Experiment'].iloc[0] == 'No_ExpGroups_Provided' else 'Experiment'\n",
-    "    strat = df['Interval'].iloc[0]\n",
-    "    type_ = df['Type'].iloc[0]\n",
+    "    cfg = SubsetConfig(df)\n",
     "\n",
     "    error_y = None\n",
     "    if not SINGLE_SAMPLE_MODE:\n",
@@ -619,17 +638,16 @@
     "    plot_df = plot_df.replace('Ti', 'Transitions').replace('Tv', 'Transversions')\n",
     "\n",
     "    fig = px.bar(plot_df, x='Substitution_Type', y=f'{stat}_mean', error_y=error_y, \n",
-    "                  title=f'Plot of {stat} mean by Substitution Type on {strat} for {type_}', \n",
-    "                  hover_data=['TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean', 'IGN_mean', 'OUT_mean'], color=color, barmode='group',\n",
+    "                  title=cfg.make_title(f'Plot of {stat} mean by Substitution Type'), \n",
+    "                  hover_data=['TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean', 'IGN_mean', 'OUT_mean'], color=cfg.color, barmode='group',\n",
     "                  category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "    if axes_mode == 'Fixed' and stat in ['Precision', 'Recall', 'F1_Score']:\n",
     "        fig.update_layout(yaxis_range=[0, 1.1])\n",
     "    return fig\n",
     "\n",
     "def make_snp_substitution_plot(df, stat, axes_mode):\n",
-    "    color = None if df['Experiment'].iloc[0] == 'No_ExpGroups_Provided' else 'Experiment'\n",
-    "    strat = df['Interval'].iloc[0]\n",
-    "    type_ = df['Type'].iloc[0]\n",
+    "    cfg = SubsetConfig(df)\n",
+    "\n",
     "    df_means = df.groupby(['Experiment', 'Type', 'Substitution_Type', \n",
     "                           'Ref_Nucleotide', 'Var_Nucleotide'])[['TP_Base', 'TP_Query', \n",
     "                                                                 'FP', 'FN', 'F1_Score', 'Precision', 'Recall', 'IGN', 'OUT']].mean().reset_index()\n",
@@ -647,9 +665,9 @@
     "    if EXPERIMENT_ORDER is not None:\n",
     "        category_orders = {**category_orders, **{'Experiment': EXPERIMENT_ORDER}}\n",
     "\n",
-    "    fig = px.scatter_3d(plot_df, x='Ref_Nucleotide', y='Var_Nucleotide', z=f'{stat}_mean', error_z=f'{stat}_conf', color=color, \n",
+    "    fig = px.scatter_3d(plot_df, x='Ref_Nucleotide', y='Var_Nucleotide', z=f'{stat}_mean', error_z=f'{stat}_conf', color=cfg.color, \n",
     "                        hover_data=['TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean', 'IGN_mean', 'OUT_mean'],\n",
-    "                        title=f'Plot of {stat} per Substitution Type on {strat} for {type_}', \n",
+    "                        title=cfg.make_title(f'Plot of {stat} per Substitution Type'), \n",
     "                        category_orders=category_orders, symbol='Substitution_Type_mean', color_discrete_map=EXPERIMENT_COLOR_MAP,\n",
     "                        height=700, width=1000,\n",
     "                       )\n",
@@ -745,9 +763,7 @@
    "outputs": [],
    "source": [
     "def make_idd_plot(df, stat, axes_mode):\n",
-    "    color = None if df['Experiment'].iloc[0] == 'No_ExpGroups_Provided' else 'Experiment'\n",
-    "    strat = df['Interval'].iloc[0]\n",
-    "    type_ = df['Type'].iloc[0]\n",
+    "    cfg = SubsetConfig(df)\n",
     "\n",
     "    error_y = None\n",
     "    if not SINGLE_SAMPLE_MODE:\n",
@@ -756,8 +772,8 @@
     "    else:\n",
     "        plot_df = df\n",
     "    \n",
-    "    fig = px.line(plot_df, x='INDEL_Length', y=f'{stat}_mean', error_y=error_y, title=f'Plot of {stat} mean by INDEL Length on {strat} for {type_}', \n",
-    "                  hover_data=['TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean', 'IGN_mean', 'OUT_mean'], color=color, line_group=color, \n",
+    "    fig = px.line(plot_df, x='INDEL_Length', y=f'{stat}_mean', error_y=error_y, title=cfg.make_title(f'Plot of {stat} mean by INDEL Length'), \n",
+    "                  hover_data=['TP_Base_mean', 'TP_Query_mean', 'FP_mean', 'FN_mean', 'IGN_mean', 'OUT_mean'], color=cfg.color, line_group=cfg.color, \n",
     "                  category_orders=CATEGORY_ORDERS, color_discrete_map=EXPERIMENT_COLOR_MAP)\n",
     "    if axes_mode == 'Fixed' and stat in ['Precision', 'Recall', 'F1_Score']:\n",
     "        fig.update_layout(yaxis_range=[0, 1.1])\n",
@@ -859,7 +875,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "start_app(board, app_title='BenchmarkBoard', mode='external', port=8055)"
+    "start_app(board, app_title='BenchmarkBoard', jupyter_mode='external', port=8050)"
    ]
   },
   {
@@ -881,9 +897,9 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "quickboard_venv",
+   "display_name": "Python 3 (ipykernel)",
    "language": "python",
-   "name": "quickboard_venv"
+   "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
@@ -895,7 +911,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.9.6"
+   "version": "3.10.9"
   }
  },
  "nbformat": 4,
diff --git a/BenchmarkVCFs/BenchmarkBoard/BenchmarkBoard_README.md b/BenchmarkVCFs/BenchmarkBoard/BenchmarkBoard_README.md
@@ -5,7 +5,7 @@ BenchmarkBoard is an interactive visualizer meant to complement the [SimpleBench
 ## Quickstart
 
 To use the BenchmarkBoard, you must satisfy the following requirements:
-1. Have a Python environment with [Quickboard](https://github.com/broadinstitute/quickboard) installed, e.g. `pip install quickboard`. The current version of this app should use `quickboard==0.3.3`. 
+1. Have a Python environment with [Quickboard](https://github.com/broadinstitute/quickboard) installed. The current version of this app should use `quickboard==0.4.0`, e.g. `pip install quickboard==0.4.0`.
 2. Have the files output by the SimpleBenchmark tool saved locally with their default names.
 3. Have a copy of the `BenchmarkBoard.py` or `BenchmarkBoard.ipynb` file saved in the *same* directory as the files from the WDL.