From 596196997f03034a526da664db1ec64e8495bd20 Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Wed, 1 May 2024 16:00:40 -0400
Subject: [PATCH 01/29] clastr api proof of concept
---
poetry.lock | 114 ++++++++++------
pyproject.toml | 2 +-
requirements.txt | 2 +-
strprofiler/shiny_app/clastr_api.py | 197 ++++++++++++++++++++++++++++
strprofiler/shiny_app/shiny_app.py | 77 ++++++++++-
strprofiler/utils.py | 2 +-
6 files changed, 346 insertions(+), 48 deletions(-)
create mode 100644 strprofiler/shiny_app/clastr_api.py
diff --git a/poetry.lock b/poetry.lock
index b35cc6f..d4bed28 100644
--- a/poetry.lock
+++ b/poetry.lock
@@ -1,4 +1,4 @@
-# This file is automatically @generated by Poetry 1.7.1 and should not be changed by hand.
+# This file is automatically @generated by Poetry 1.8.2 and should not be changed by hand.
[[package]]
name = "anyio"
@@ -88,13 +88,13 @@ files = [
[[package]]
name = "exceptiongroup"
-version = "1.2.0"
+version = "1.2.1"
description = "Backport of PEP 654 (exception groups)"
optional = false
python-versions = ">=3.7"
files = [
- {file = "exceptiongroup-1.2.0-py3-none-any.whl", hash = "sha256:4bfd3996ac73b41e9b9628b04e079f193850720ea5945fc96a08633c66912f14"},
- {file = "exceptiongroup-1.2.0.tar.gz", hash = "sha256:91f5c769735f051a4290d52edd0858999b57e5876e9f85937691bd4c9fa3ed68"},
+ {file = "exceptiongroup-1.2.1-py3-none-any.whl", hash = "sha256:5258b9ed329c5bbdd31a309f53cbfb0b155341807f6ff7606a1e801a891b29ad"},
+ {file = "exceptiongroup-1.2.1.tar.gz", hash = "sha256:a4785e48b045528f5bfe627b6ad554ff32def154f42372786903b7abcfe1aa16"},
]
[package.extras]
@@ -391,51 +391,76 @@ files = [
[[package]]
name = "pandas"
-version = "1.5.3"
+version = "2.2.2"
description = "Powerful data structures for data analysis, time series, and statistics"
optional = false
-python-versions = ">=3.8"
+python-versions = ">=3.9"
files = [
- {file = "pandas-1.5.3-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:3749077d86e3a2f0ed51367f30bf5b82e131cc0f14260c4d3e499186fccc4406"},
- {file = "pandas-1.5.3-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:972d8a45395f2a2d26733eb8d0f629b2f90bebe8e8eddbb8829b180c09639572"},
- {file = "pandas-1.5.3-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:50869a35cbb0f2e0cd5ec04b191e7b12ed688874bd05dd777c19b28cbea90996"},
- {file = "pandas-1.5.3-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:c3ac844a0fe00bfaeb2c9b51ab1424e5c8744f89860b138434a363b1f620f354"},
- {file = "pandas-1.5.3-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:7a0a56cef15fd1586726dace5616db75ebcfec9179a3a55e78f72c5639fa2a23"},
- {file = "pandas-1.5.3-cp310-cp310-win_amd64.whl", hash = "sha256:478ff646ca42b20376e4ed3fa2e8d7341e8a63105586efe54fa2508ee087f328"},
- {file = "pandas-1.5.3-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:6973549c01ca91ec96199e940495219c887ea815b2083722821f1d7abfa2b4dc"},
- {file = "pandas-1.5.3-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:c39a8da13cede5adcd3be1182883aea1c925476f4e84b2807a46e2775306305d"},
- {file = "pandas-1.5.3-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:f76d097d12c82a535fda9dfe5e8dd4127952b45fea9b0276cb30cca5ea313fbc"},
- {file = "pandas-1.5.3-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e474390e60ed609cec869b0da796ad94f420bb057d86784191eefc62b65819ae"},
- {file = "pandas-1.5.3-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5f2b952406a1588ad4cad5b3f55f520e82e902388a6d5a4a91baa8d38d23c7f6"},
- {file = "pandas-1.5.3-cp311-cp311-win_amd64.whl", hash = "sha256:bc4c368f42b551bf72fac35c5128963a171b40dce866fb066540eeaf46faa003"},
- {file = "pandas-1.5.3-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:14e45300521902689a81f3f41386dc86f19b8ba8dd5ac5a3c7010ef8d2932813"},
- {file = "pandas-1.5.3-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:9842b6f4b8479e41968eced654487258ed81df7d1c9b7b870ceea24ed9459b31"},
- {file = "pandas-1.5.3-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:26d9c71772c7afb9d5046e6e9cf42d83dd147b5cf5bcb9d97252077118543792"},
- {file = "pandas-1.5.3-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:5fbcb19d6fceb9e946b3e23258757c7b225ba450990d9ed63ccceeb8cae609f7"},
- {file = "pandas-1.5.3-cp38-cp38-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:565fa34a5434d38e9d250af3c12ff931abaf88050551d9fbcdfafca50d62babf"},
- {file = "pandas-1.5.3-cp38-cp38-win32.whl", hash = "sha256:87bd9c03da1ac870a6d2c8902a0e1fd4267ca00f13bc494c9e5a9020920e1d51"},
- {file = "pandas-1.5.3-cp38-cp38-win_amd64.whl", hash = "sha256:41179ce559943d83a9b4bbacb736b04c928b095b5f25dd2b7389eda08f46f373"},
- {file = "pandas-1.5.3-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:c74a62747864ed568f5a82a49a23a8d7fe171d0c69038b38cedf0976831296fa"},
- {file = "pandas-1.5.3-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:c4c00e0b0597c8e4f59e8d461f797e5d70b4d025880516a8261b2817c47759ee"},
- {file = "pandas-1.5.3-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:a50d9a4336a9621cab7b8eb3fb11adb82de58f9b91d84c2cd526576b881a0c5a"},
- {file = "pandas-1.5.3-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:dd05f7783b3274aa206a1af06f0ceed3f9b412cf665b7247eacd83be41cf7bf0"},
- {file = "pandas-1.5.3-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9f69c4029613de47816b1bb30ff5ac778686688751a5e9c99ad8c7031f6508e5"},
- {file = "pandas-1.5.3-cp39-cp39-win32.whl", hash = "sha256:7cec0bee9f294e5de5bbfc14d0573f65526071029d036b753ee6507d2a21480a"},
- {file = "pandas-1.5.3-cp39-cp39-win_amd64.whl", hash = "sha256:dfd681c5dc216037e0b0a2c821f5ed99ba9f03ebcf119c7dac0e9a7b960b9ec9"},
- {file = "pandas-1.5.3.tar.gz", hash = "sha256:74a3fd7e5a7ec052f183273dc7b0acd3a863edf7520f5d3a1765c04ffdb3b0b1"},
+ {file = "pandas-2.2.2-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:90c6fca2acf139569e74e8781709dccb6fe25940488755716d1d354d6bc58bce"},
+ {file = "pandas-2.2.2-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:c7adfc142dac335d8c1e0dcbd37eb8617eac386596eb9e1a1b77791cf2498238"},
+ {file = "pandas-2.2.2-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:4abfe0be0d7221be4f12552995e58723c7422c80a659da13ca382697de830c08"},
+ {file = "pandas-2.2.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:8635c16bf3d99040fdf3ca3db669a7250ddf49c55dc4aa8fe0ae0fa8d6dcc1f0"},
+ {file = "pandas-2.2.2-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:40ae1dffb3967a52203105a077415a86044a2bea011b5f321c6aa64b379a3f51"},
+ {file = "pandas-2.2.2-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:8e5a0b00e1e56a842f922e7fae8ae4077aee4af0acb5ae3622bd4b4c30aedf99"},
+ {file = "pandas-2.2.2-cp310-cp310-win_amd64.whl", hash = "sha256:ddf818e4e6c7c6f4f7c8a12709696d193976b591cc7dc50588d3d1a6b5dc8772"},
+ {file = "pandas-2.2.2-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:696039430f7a562b74fa45f540aca068ea85fa34c244d0deee539cb6d70aa288"},
+ {file = "pandas-2.2.2-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:8e90497254aacacbc4ea6ae5e7a8cd75629d6ad2b30025a4a8b09aa4faf55151"},
+ {file = "pandas-2.2.2-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:58b84b91b0b9f4bafac2a0ac55002280c094dfc6402402332c0913a59654ab2b"},
+ {file = "pandas-2.2.2-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:6d2123dc9ad6a814bcdea0f099885276b31b24f7edf40f6cdbc0912672e22eee"},
+ {file = "pandas-2.2.2-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:2925720037f06e89af896c70bca73459d7e6a4be96f9de79e2d440bd499fe0db"},
+ {file = "pandas-2.2.2-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:0cace394b6ea70c01ca1595f839cf193df35d1575986e484ad35c4aeae7266c1"},
+ {file = "pandas-2.2.2-cp311-cp311-win_amd64.whl", hash = "sha256:873d13d177501a28b2756375d59816c365e42ed8417b41665f346289adc68d24"},
+ {file = "pandas-2.2.2-cp312-cp312-macosx_10_9_x86_64.whl", hash = "sha256:9dfde2a0ddef507a631dc9dc4af6a9489d5e2e740e226ad426a05cabfbd7c8ef"},
+ {file = "pandas-2.2.2-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:e9b79011ff7a0f4b1d6da6a61aa1aa604fb312d6647de5bad20013682d1429ce"},
+ {file = "pandas-2.2.2-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:1cb51fe389360f3b5a4d57dbd2848a5f033350336ca3b340d1c53a1fad33bcad"},
+ {file = "pandas-2.2.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:eee3a87076c0756de40b05c5e9a6069c035ba43e8dd71c379e68cab2c20f16ad"},
+ {file = "pandas-2.2.2-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:3e374f59e440d4ab45ca2fffde54b81ac3834cf5ae2cdfa69c90bc03bde04d76"},
+ {file = "pandas-2.2.2-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:43498c0bdb43d55cb162cdc8c06fac328ccb5d2eabe3cadeb3529ae6f0517c32"},
+ {file = "pandas-2.2.2-cp312-cp312-win_amd64.whl", hash = "sha256:d187d355ecec3629624fccb01d104da7d7f391db0311145817525281e2804d23"},
+ {file = "pandas-2.2.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:0ca6377b8fca51815f382bd0b697a0814c8bda55115678cbc94c30aacbb6eff2"},
+ {file = "pandas-2.2.2-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:9057e6aa78a584bc93a13f0a9bf7e753a5e9770a30b4d758b8d5f2a62a9433cd"},
+ {file = "pandas-2.2.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:001910ad31abc7bf06f49dcc903755d2f7f3a9186c0c040b827e522e9cef0863"},
+ {file = "pandas-2.2.2-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:66b479b0bd07204e37583c191535505410daa8df638fd8e75ae1b383851fe921"},
+ {file = "pandas-2.2.2-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:a77e9d1c386196879aa5eb712e77461aaee433e54c68cf253053a73b7e49c33a"},
+ {file = "pandas-2.2.2-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:92fd6b027924a7e178ac202cfbe25e53368db90d56872d20ffae94b96c7acc57"},
+ {file = "pandas-2.2.2-cp39-cp39-win_amd64.whl", hash = "sha256:640cef9aa381b60e296db324337a554aeeb883ead99dc8f6c18e81a93942f5f4"},
+ {file = "pandas-2.2.2.tar.gz", hash = "sha256:9e79019aba43cb4fda9e4d983f8e88ca0373adbb697ae9c6c43093218de28b54"},
]
[package.dependencies]
numpy = [
- {version = ">=1.20.3", markers = "python_version < \"3.10\""},
- {version = ">=1.23.2", markers = "python_version >= \"3.11\""},
- {version = ">=1.21.0", markers = "python_version >= \"3.10\" and python_version < \"3.11\""},
+ {version = ">=1.22.4", markers = "python_version < \"3.11\""},
+ {version = ">=1.23.2", markers = "python_version == \"3.11\""},
+ {version = ">=1.26.0", markers = "python_version >= \"3.12\""},
]
-python-dateutil = ">=2.8.1"
+python-dateutil = ">=2.8.2"
pytz = ">=2020.1"
+tzdata = ">=2022.7"
[package.extras]
-test = ["hypothesis (>=5.5.3)", "pytest (>=6.0)", "pytest-xdist (>=1.31)"]
+all = ["PyQt5 (>=5.15.9)", "SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "adbc-driver-sqlite (>=0.8.0)", "beautifulsoup4 (>=4.11.2)", "bottleneck (>=1.3.6)", "dataframe-api-compat (>=0.1.7)", "fastparquet (>=2022.12.0)", "fsspec (>=2022.11.0)", "gcsfs (>=2022.11.0)", "html5lib (>=1.1)", "hypothesis (>=6.46.1)", "jinja2 (>=3.1.2)", "lxml (>=4.9.2)", "matplotlib (>=3.6.3)", "numba (>=0.56.4)", "numexpr (>=2.8.4)", "odfpy (>=1.4.1)", "openpyxl (>=3.1.0)", "pandas-gbq (>=0.19.0)", "psycopg2 (>=2.9.6)", "pyarrow (>=10.0.1)", "pymysql (>=1.0.2)", "pyreadstat (>=1.2.0)", "pytest (>=7.3.2)", "pytest-xdist (>=2.2.0)", "python-calamine (>=0.1.7)", "pyxlsb (>=1.0.10)", "qtpy (>=2.3.0)", "s3fs (>=2022.11.0)", "scipy (>=1.10.0)", "tables (>=3.8.0)", "tabulate (>=0.9.0)", "xarray (>=2022.12.0)", "xlrd (>=2.0.1)", "xlsxwriter (>=3.0.5)", "zstandard (>=0.19.0)"]
+aws = ["s3fs (>=2022.11.0)"]
+clipboard = ["PyQt5 (>=5.15.9)", "qtpy (>=2.3.0)"]
+compression = ["zstandard (>=0.19.0)"]
+computation = ["scipy (>=1.10.0)", "xarray (>=2022.12.0)"]
+consortium-standard = ["dataframe-api-compat (>=0.1.7)"]
+excel = ["odfpy (>=1.4.1)", "openpyxl (>=3.1.0)", "python-calamine (>=0.1.7)", "pyxlsb (>=1.0.10)", "xlrd (>=2.0.1)", "xlsxwriter (>=3.0.5)"]
+feather = ["pyarrow (>=10.0.1)"]
+fss = ["fsspec (>=2022.11.0)"]
+gcp = ["gcsfs (>=2022.11.0)", "pandas-gbq (>=0.19.0)"]
+hdf5 = ["tables (>=3.8.0)"]
+html = ["beautifulsoup4 (>=4.11.2)", "html5lib (>=1.1)", "lxml (>=4.9.2)"]
+mysql = ["SQLAlchemy (>=2.0.0)", "pymysql (>=1.0.2)"]
+output-formatting = ["jinja2 (>=3.1.2)", "tabulate (>=0.9.0)"]
+parquet = ["pyarrow (>=10.0.1)"]
+performance = ["bottleneck (>=1.3.6)", "numba (>=0.56.4)", "numexpr (>=2.8.4)"]
+plot = ["matplotlib (>=3.6.3)"]
+postgresql = ["SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "psycopg2 (>=2.9.6)"]
+pyarrow = ["pyarrow (>=10.0.1)"]
+spss = ["pyreadstat (>=1.2.0)"]
+sql-other = ["SQLAlchemy (>=2.0.0)", "adbc-driver-postgresql (>=0.8.0)", "adbc-driver-sqlite (>=0.8.0)"]
+test = ["hypothesis (>=6.46.1)", "pytest (>=7.3.2)", "pytest-xdist (>=2.2.0)"]
+xml = ["lxml (>=4.9.2)"]
[[package]]
name = "prompt-toolkit"
@@ -664,6 +689,17 @@ files = [
{file = "typing_extensions-4.11.0.tar.gz", hash = "sha256:83f085bd5ca59c80295fc2a82ab5dac679cbe02b9f33f7d83af68e241bea51b0"},
]
+[[package]]
+name = "tzdata"
+version = "2024.1"
+description = "Provider of IANA time zone data"
+optional = false
+python-versions = ">=2"
+files = [
+ {file = "tzdata-2024.1-py2.py3-none-any.whl", hash = "sha256:9068bc196136463f5245e51efda838afa15aaeca9903f49050dfa2679db4d252"},
+ {file = "tzdata-2024.1.tar.gz", hash = "sha256:2674120f8d891909751c38abcdfd386ac0a5a1127954fbc332af6b5ceae07efd"},
+]
+
[[package]]
name = "uc-micro-py"
version = "1.0.3"
@@ -879,4 +915,4 @@ files = [
[metadata]
lock-version = "2.0"
python-versions = ">=3.9,<4.0"
-content-hash = "51da1c89cdbc1170fa0c07a6d445e394791deaf26efaa86b5aa7603b8fcaabcc"
+content-hash = "bada9554d3318a11886e1e0e6d3f020beafe8e4c6db8b9249b3b38fcb6c31ef0"
diff --git a/pyproject.toml b/pyproject.toml
index ccc0b01..f83e082 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -10,7 +10,7 @@ readme = "README.md"
[tool.poetry.dependencies]
python = ">=3.9,<4.0"
-pandas = "^1.4.3"
+pandas = "^2.2"
rich-click = "^1.5.2"
numpy = "^1.26.3"
openpyxl = "^3.0.10"
diff --git a/requirements.txt b/requirements.txt
index 5473afd..cc6d05c 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,7 +1,7 @@
# Automatically generated by https://github.com/damnever/pigar.
numpy==1.26.3
-pandas==1.5.3
+pandas==2.2
rich-click==1.7.3
shiny==0.8.1
shinyswatch==0.4.2
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
new file mode 100644
index 0000000..aa706c8
--- /dev/null
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -0,0 +1,197 @@
+import requests
+import json
+import pandas as pd
+from flatten_json import flatten
+
+
+def clastr_query(query, query_filter, include_amelogenin, score_filter):
+ url = "https://www.cellosaurus.org/str-search/api/query/"
+
+ if query_filter == "Tanabe":
+ query['algorithm'] = 1
+ elif query_filter == "Masters Query":
+ query['algorithm'] = 2
+ elif query_filter == "Masters Reference":
+ query['algorithm'] = 3
+
+ query['includeAmelogenin'] = include_amelogenin
+ query['scoreFilter'] = score_filter
+
+ r = requests.post(url, data=json.dumps(query))
+
+ # JSON response:
+ # 'description': '',
+ # 'cellosaurusRelease': '48.0',
+ # 'runOn': '2024-Apr-25 12:45:40 UTC+0',
+ # 'toolVersion': '1.4.4',
+ # 'searchSpace': 8581,
+ # 'parameters': {...
+ # 'results': [{ ...
+ # FULL STRUCTURE OUTLINED BELOW.
+
+ try:
+ r.raise_for_status()
+ except requests.exceptions.HTTPError as e:
+ return pd.DataFrame({"Error": [str(e)]})
+
+ df = pd.DataFrame.from_dict(r.json()['results'])
+
+ if df.empty:
+ return pd.DataFrame({"No Clastr Result": []})
+
+ flattened = [flatten(d) for d in r.json()['results']]
+ df = pd.DataFrame(flattened)
+
+ # profiles[0] has 'bestScore' returns.
+ # Markers within profiles[0] are split by each allele 'value'
+ # First select alleles, and then concat alleles by return and marker
+ markers = df.filter(regex='^profiles_0_.*_value').T
+ markers[['A', 'B', 'C', 'markerID', 'E', 'F', 'G']] = markers.index.str.split('_', n=7, expand=False).tolist()
+ markers.drop(['A', 'B', 'C', 'E', 'F', 'G'], axis=1, inplace=True)
+
+ # Melt dataframe to: [markerID, resultID, allele] for cat on markerID/resultID
+ melted_markers = pd.melt(markers, id_vars=['markerID'], var_name='resultID', value_name='allele')
+
+ # Join resultID and markerID index to grouped joined allele strings.
+ allele_cat_markers = pd.concat([
+ melted_markers[['resultID', 'markerID']],
+ melted_markers.groupby(['resultID', 'markerID'], as_index=True).transform(lambda x: ','
+ .join(map(str, x)).replace(",nan", "").replace("nan", ""))
+ ], axis=1).drop_duplicates(subset=['resultID', 'markerID'])
+
+ # Marker names are not consistent across results. MarkerName[1] != the same thing in all cases.
+ # We must track marker name by index by result.
+ # The same logic from above applies, split the compound column name string,
+ # Melt on markerID, and then merge with concat allele made above.
+ # Finally, pivot into a table and rejoin to higher level results.
+ marker_names = df.filter(regex='^profiles_0_.*_name').T
+ marker_names[['A', 'B', 'C', 'markerID', 'E']] = marker_names.index.str.split('_', n=5, expand=False).tolist()
+ marker_names.drop(['A', 'B', 'C', 'E'], axis=1, inplace=True)
+
+ melted_markers = pd.melt(marker_names, id_vars=['markerID'],
+ var_name='resultID', value_name='markerName').dropna().drop_duplicates(subset=['markerID', 'resultID'])
+
+ markers_names_alleles = pd.merge(allele_cat_markers, melted_markers, how='inner', on=['markerID', 'resultID'])
+
+ pivot_markers_names_alleles = markers_names_alleles.pivot(index=['resultID'], columns='markerName', values='allele')
+
+ try:
+ merged = pd.merge(df[['accession', 'name', 'species', 'bestScore', 'problem']],
+ pivot_markers_names_alleles, left_index=True, right_on='resultID')
+ except KeyError:
+ merged = pd.merge(df[['accession', 'name', 'species', 'bestScore']], pivot_markers_names_alleles, left_index=True, right_on='resultID')
+
+ merged['accession_link'] = "https://web.expasy.org/cellosaurus/" + merged['accession']
+ print(merged)
+ # return final df
+
+ # TO DO: Add query to top of merged DF before return.
+
+ return merged
+
+
+if __name__ == '__main__':
+ # url = "https://www.cellosaurus.org/str-search/api/query/%"
+ # Use above URL for 400 error
+
+ # sample J000077451
+ data = {"Amelogenin": "X,Y",
+ "CSF1PO": "12",
+ "D2S1338": "17,19",
+ "D3S1358": "15",
+ "D5S818": "11,12",
+ "D7S820": "11,12",
+ "D8S1179": "12,15",
+ "D13S317": "8",
+ "D16S539": "13",
+ "D18S51": "14",
+ "D19S433": "14",
+ "D21S11": "31,31.2",
+ "FGA": "23",
+ "Penta D": "",
+ "Penta E": "",
+ "TH01": "7,9.3",
+ "TPOX": "8",
+ "vWA": "18",
+ }
+
+ # # stock from https://www.cellosaurus.org/str-search/help.html#5.1
+ # data = {
+ # "Amelogenin": "X",
+ # "CSF1PO": "13,14",
+ # "D5S818": "13",
+ # "D7S820": "8",
+ # "D13S317": "12",
+ # "FGA": "24",
+ # "TH01": "8",
+ # "TPOX": "11",
+ # "vWA": "16",
+ # }
+
+ r = clastr_query(data, 'Tanabe', False, 70)
+
+ print(r)
+
+# JSON data structure:
+# {
+# "description": "",
+# "cellosaurusRelease": "48.0",
+# "runOn": "2024-Apr-30 18:15:31 UTC+0",
+# "toolVersion": "1.4.4",
+# "searchSpace": 8581,
+# "parameters": {
+# "species": "Homo sapiens (Human)",
+# "algorithm": "Tanabe",
+# "scoringMode": "Non-empty makers",
+# "scoreFilter": 70,
+# "minMarkers": 8,
+# "maxResults": 200,
+# "includeAmelogenin": false,
+# "markers": [ {
+# "name": "Amelogenin",
+# "alleles": [
+# {
+# "value": "X"
+# },
+# {
+# "value": "Y"
+# }
+# ]
+# }, ... ]
+# },
+# "results": [
+# {
+# "accession": "CVCL_2335",
+# "name": "CCD-1076Sk",
+# "species": "Homo sapiens (Human)",
+# "bestScore": 72.0,
+# "problematic": false,
+# "profiles": [
+# {
+# "score": 72.0,
+# "markerNumber": 8,
+# "alleleNumber": 14,
+# "markers": [
+# {
+# "name": "Amelogenin",
+# "conflicted": false,
+# "searched": true,
+# "sources": [],
+# "alleles": [
+# {
+# "value": "X",
+# "matched": true
+# },
+# {
+# "value": "Y",
+# "matched": true
+# }
+# ]
+# },
+# ...
+# }
+#
+#
+# }
+#
+# ]
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index 7ec1ce0..daf4869 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -6,6 +6,7 @@
import strprofiler.utils as sp
from strprofiler.shiny_app.calc_functions import _single_query, _batch_query, _file_query
+from strprofiler.shiny_app.clastr_api import clastr_query
from datetime import date
import time
@@ -65,9 +66,15 @@ def _highlight_non_matches(s):
is_match = s == s.iloc[0]
return ["text-align:center;background-color:#ec7a80" if not v else "text-align:center" for v in is_match]
-# App Generation ###
+
+def _link_wrap(name, link, problem):
+ if not pd.isna(problem):
+ return ui.tooltip(ui.tags.a(name, href=str(link), target="_blank", style="text-align:center;font-style:oblique;color:#ec7a80"), f"{problem}")
+ else:
+ return ui.tags.a(name, href=str(link), target="_blank")
+# App Generation ###
def create_app(db=None):
f = importlib.resources.files("strprofiler.shiny_app")
@@ -93,7 +100,6 @@ def create_app(db=None):
)
)
- # TODO move this to a separate function
app_ui = ui.page_fluid(
ui.tags.style("#main {padding:12px !important} #sidebar {padding:12px}"),
ui.tags.style(
@@ -188,6 +194,12 @@ def create_app(db=None):
class_="btn-danger",
width="45%",
),
+ ui.input_action_button(
+ "clastr",
+ "Clastr",
+ class_="btn-success",
+ width="45%",
+ ),
),
),
),
@@ -199,10 +211,23 @@ def create_app(db=None):
ui.column(3, ui.tags.h3("Results")),
ui.column(1, ui.p("")),
),
- ui.column(
- 12,
- {"id": "res_card"},
- ui.output_table("out_result"),
+ ui.navset_card_tab(
+ ui.nav_panel(
+ "STR Profiler",
+ ui.column(
+ 12,
+ {"id": "res_card"},
+ ui.output_table("out_result"),
+ ),
+ ),
+ ui.nav_panel(
+ "CLASTR",
+ ui.column(
+ 12,
+ {"id": "res_card"},
+ ui.output_table("clastr_table"),
+ ),
+ ),
),
full_screen=False,
fill=False,
@@ -416,6 +441,7 @@ def server(input, output, session):
str_database = reactive.value(init_db)
db_name = reactive.value(init_db_name)
output_df = reactive.value(None)
+ output_df_clastr = reactive.value(None)
demo_vals = reactive.value(None)
demo_name = reactive.value(None)
markers = reactive.value([i for i in list(init_db[next(iter(init_db))].keys()) if not any([e for e in ['Center', 'Passage'] if e in i])])
@@ -554,6 +580,45 @@ def loaded_example_text():
x = ui.strong("")
return x
+ @reactive.calc
+ @reactive.event(input.clastr)
+ def clastr_results():
+ query = {m: input[m]() for m in markers()}
+ thinking = ui.notification_show("Message ", duration=None)
+ clastr_return = clastr_query(query, input.query_filter(), input.score_amel_query(), input.query_filter_threshold())
+ ui.notification_remove(thinking)
+ return clastr_return
+
+ @output
+ @render.table
+ def clastr_table():
+ output_df_clastr.set(clastr_results())
+ if output_df_clastr() is not None:
+ out_df = output_df_clastr().copy()
+ print(out_df)
+ if ('No Clastr Result' in out_df.columns) | ('Error' in out_df.columns):
+ return out_df
+ try:
+ out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, x.problem), axis=1)
+ except Exception:
+ out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, pd.NA), axis=1)
+ out_df = out_df.drop(['accession', 'accession_link', 'species'], axis=1).rename(
+ columns={"link": "Accession", "name": "Name", "bestScore": "Score"})
+ cols = list(out_df.columns)
+ cols = [cols[-1]] + cols[:-1]
+ out_df = out_df[cols]
+ out_df = out_df.style.set_table_attributes(
+ 'class="dataframe shiny-table table w-auto"'
+ ).hide(axis="index").format(
+ {
+ "Score": "{0:0.2f}",
+ },
+ na_rep=""
+ )
+ else:
+ out_df = pd.DataFrame({"No input provided.": []})
+ return out_df
+
# Dealing with calculating a results table
# Catch when either reset or search is clicked
# If reset, clear the query and run to make an empty df.
diff --git a/strprofiler/utils.py b/strprofiler/utils.py
index 33e6ffa..987128f 100644
--- a/strprofiler/utils.py
+++ b/strprofiler/utils.py
@@ -187,7 +187,7 @@ def str_ingress(
else:
sys.exit('File extension: ' + path.suffix + ' in file: ' + str(path) + ' is not supported.')
- df = df.applymap(lambda x: x.strip() if isinstance(x, str) else x)
+ df = df.map(lambda x: x.strip() if isinstance(x, str) else x)
df.columns = df.columns.str.strip()
From 9916ad9005fab5dac18349037d1a83d608f5ccaa Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 2 May 2024 14:40:40 -0400
Subject: [PATCH 02/29] query row added, UI adjustment
---
app.py | 3 +
strprofiler/shiny_app/clastr_api.py | 23 +++-
strprofiler/shiny_app/shiny_app.py | 160 +++++++++++++---------------
3 files changed, 94 insertions(+), 92 deletions(-)
create mode 100644 app.py
diff --git a/app.py b/app.py
new file mode 100644
index 0000000..69d5d26
--- /dev/null
+++ b/app.py
@@ -0,0 +1,3 @@
+from strprofiler.shiny_app.shiny_app import create_app
+
+app = create_app()
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index aa706c8..6a7386b 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -7,6 +7,10 @@
def clastr_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/query/"
+ dct = {k: [v] for k, v in query.items()}
+ query_df = pd.DataFrame(dct)
+ query_df['accession'] = 'Query'
+
if query_filter == "Tanabe":
query['algorithm'] = 1
elif query_filter == "Masters Query":
@@ -82,12 +86,23 @@ def clastr_query(query, query_filter, include_amelogenin, score_filter):
merged = pd.merge(df[['accession', 'name', 'species', 'bestScore']], pivot_markers_names_alleles, left_index=True, right_on='resultID')
merged['accession_link'] = "https://web.expasy.org/cellosaurus/" + merged['accession']
- print(merged)
- # return final df
- # TO DO: Add query to top of merged DF before return.
+ # add the query line to the top of merged, and reorder columns
+
+ query_added = pd.concat([query_df, merged]).reset_index(drop=True)
+ query_added["bestScore"] = query_added['bestScore'].map("{0:.2f}".format).replace("nan", "")
+
+ # print(query_added.columns)
+
+ if 'problem' in query_added.columns:
+ query_added = query_added[['accession', 'name', 'species', 'bestScore', 'accession_link', 'problem'] +
+ [c for c in query_added if c not in
+ ['accession', 'name', 'species', 'bestScore', 'accession_link', 'problem']]].fillna('')
+ else:
+ query_added = query_added[['accession', 'name', 'species', 'bestScore', 'accession_link'] +
+ [c for c in query_added if c not in ['accession', 'name', 'species', 'bestScore', 'accession_link']]].fillna('')
- return merged
+ return query_added
if __name__ == '__main__':
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index daf4869..0d08163 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -68,7 +68,9 @@ def _highlight_non_matches(s):
def _link_wrap(name, link, problem):
- if not pd.isna(problem):
+ if name == 'Query':
+ return name
+ if problem != "":
return ui.tooltip(ui.tags.a(name, href=str(link), target="_blank", style="text-align:center;font-style:oblique;color:#ec7a80"), f"{problem}")
else:
return ui.tags.a(name, href=str(link), target="_blank")
@@ -182,6 +184,12 @@ def create_app(db=None):
ui.column(4, ui.output_ui("loaded_example_text")),
ui.column(
4,
+ ui.input_select(
+ "search_type",
+ "Search Type",
+ ["STR DB", "CLASTR"],
+ width="90%"
+ ),
ui.input_action_button(
"search",
"Search",
@@ -194,12 +202,6 @@ def create_app(db=None):
class_="btn-danger",
width="45%",
),
- ui.input_action_button(
- "clastr",
- "Clastr",
- class_="btn-success",
- width="45%",
- ),
),
),
),
@@ -211,23 +213,10 @@ def create_app(db=None):
ui.column(3, ui.tags.h3("Results")),
ui.column(1, ui.p("")),
),
- ui.navset_card_tab(
- ui.nav_panel(
- "STR Profiler",
- ui.column(
- 12,
- {"id": "res_card"},
- ui.output_table("out_result"),
- ),
- ),
- ui.nav_panel(
- "CLASTR",
- ui.column(
- 12,
- {"id": "res_card"},
- ui.output_table("clastr_table"),
- ),
- ),
+ ui.column(
+ 12,
+ {"id": "res_card"},
+ ui.output_table("out_result"),
),
full_screen=False,
fill=False,
@@ -418,7 +407,7 @@ def create_app(db=None):
icon_svg("github", width="30px"),
href="https://github.com/j-andrews7/strprofiler",
target="_blank",
- )
+ ),
),
title=ui.tags.a(
ui.tags.img(
@@ -441,7 +430,6 @@ def server(input, output, session):
str_database = reactive.value(init_db)
db_name = reactive.value(init_db_name)
output_df = reactive.value(None)
- output_df_clastr = reactive.value(None)
demo_vals = reactive.value(None)
demo_name = reactive.value(None)
markers = reactive.value([i for i in list(init_db[next(iter(init_db))].keys()) if not any([e for e in ['Center', 'Passage'] if e in i])])
@@ -580,45 +568,6 @@ def loaded_example_text():
x = ui.strong("")
return x
- @reactive.calc
- @reactive.event(input.clastr)
- def clastr_results():
- query = {m: input[m]() for m in markers()}
- thinking = ui.notification_show("Message ", duration=None)
- clastr_return = clastr_query(query, input.query_filter(), input.score_amel_query(), input.query_filter_threshold())
- ui.notification_remove(thinking)
- return clastr_return
-
- @output
- @render.table
- def clastr_table():
- output_df_clastr.set(clastr_results())
- if output_df_clastr() is not None:
- out_df = output_df_clastr().copy()
- print(out_df)
- if ('No Clastr Result' in out_df.columns) | ('Error' in out_df.columns):
- return out_df
- try:
- out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, x.problem), axis=1)
- except Exception:
- out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, pd.NA), axis=1)
- out_df = out_df.drop(['accession', 'accession_link', 'species'], axis=1).rename(
- columns={"link": "Accession", "name": "Name", "bestScore": "Score"})
- cols = list(out_df.columns)
- cols = [cols[-1]] + cols[:-1]
- out_df = out_df[cols]
- out_df = out_df.style.set_table_attributes(
- 'class="dataframe shiny-table table w-auto"'
- ).hide(axis="index").format(
- {
- "Score": "{0:0.2f}",
- },
- na_rep=""
- )
- else:
- out_df = pd.DataFrame({"No input provided.": []})
- return out_df
-
# Dealing with calculating a results table
# Catch when either reset or search is clicked
# If reset, clear the query and run to make an empty df.
@@ -650,7 +599,6 @@ def loaded_example_text():
ui.remove_ui("#inserted-downloader")
res_click.set(0)
-
return None
if res_click() == 0:
ui.insert_ui(
@@ -664,34 +612,70 @@ def loaded_example_text():
where="afterEnd",
)
res_click.set(1)
-
- return _single_query(
- query,
- str_database(),
- input.score_amel_query(),
- input.mix_threshold_query(),
- input.query_filter(),
- input.query_filter_threshold(),
- )
+ thinking = ui.notification_show("Message: API Query Running.", duration=None)
+ # isolate input.search_type to prevent trigger when options change.
+ with reactive.isolate():
+ if input.search_type() == 'STR DB':
+ results = _single_query(
+ query,
+ str_database(),
+ input.score_amel_query(),
+ input.mix_threshold_query(),
+ input.query_filter(),
+ input.query_filter_threshold(),
+ )
+ elif input.search_type() == 'CLASTR':
+ results = clastr_query(
+ query,
+ input.query_filter(),
+ input.score_amel_query(),
+ input.query_filter_threshold()
+ )
+ ui.notification_remove(thinking)
+ return results
@output
@render.table
def out_result():
output_df.set(output_results())
if output_df() is not None:
- out_df = output_df().copy()
- out_df = out_df.style.set_table_attributes(
- 'class="dataframe shiny-table table w-auto"'
- ).hide(axis="index").apply(_highlight_non_matches, subset=markers(), axis=0).format(
- {
- "Shared Markers": "{0:0.0f}",
- "Shared Alleles": "{0:0.0f}",
- "Tanabe Score": "{0:0.2f}",
- "Masters Query Score": "{0:0.2f}",
- "Masters Ref Score": "{0:0.2f}",
- },
- na_rep=""
- )
+ # isolate input.search_type to prevent trigger when options change.
+ with reactive.isolate():
+ if input.search_type() == 'STR DB':
+ out_df = output_df().copy()
+ out_df = out_df.style.set_table_attributes(
+ 'class="dataframe shiny-table table w-auto"'
+ ).hide(axis="index").apply(_highlight_non_matches, subset=markers(), axis=0).format(
+ {
+ "Shared Markers": "{0:0.0f}",
+ "Shared Alleles": "{0:0.0f}",
+ "Tanabe Score": "{0:0.2f}",
+ "Masters Query Score": "{0:0.2f}",
+ "Masters Ref Score": "{0:0.2f}",
+ },
+ na_rep=""
+ )
+ elif input.search_type() == 'CLASTR':
+ out_df = output_df().copy()
+ print(out_df)
+ if ('No Clastr Result' in out_df.columns) | ('Error' in out_df.columns):
+ return out_df
+ try:
+ out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, x.problem), axis=1)
+ out_df.drop(columns=['problem'], inplace=True)
+ except Exception:
+ out_df['link'] = out_df.apply(lambda x: _link_wrap(x.accession, x.accession_link, ''), axis=1)
+
+ out_df = out_df.drop(['accession', 'accession_link', 'species'], axis=1).rename(
+ columns={"link": "Accession", "name": "Name", "bestScore": "Score"})
+
+ cols = list(out_df.columns)
+ cols = [cols[-1]] + cols[:-1]
+
+ out_df = out_df[cols]
+ out_df = out_df.style.set_table_attributes(
+ 'class="dataframe shiny-table table w-auto"'
+ ).hide(axis="index").apply(_highlight_non_matches, subset=markers(), axis=0)
else:
out_df = pd.DataFrame({"No input provided.": []})
return out_df
From 9bba28fc359420b1cedd480100d39150b8b4e90b Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 2 May 2024 15:51:20 -0400
Subject: [PATCH 03/29] tooltip added, help updated, req for deploy updated
---
requirements.txt | 5 ++-
strprofiler/shiny_app/shiny_app.py | 33 +++++++++-----
strprofiler/shiny_app/www/help.html | 69 ++++++++++++++++++++++++++---
strprofiler/shiny_app/www/help.md | 31 ++++++++++---
4 files changed, 115 insertions(+), 23 deletions(-)
diff --git a/requirements.txt b/requirements.txt
index cc6d05c..9ebff4b 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,7 +1,10 @@
# Automatically generated by https://github.com/damnever/pigar.
+faicons==0.2.2
+flatten-json==0.1.14
numpy==1.26.3
-pandas==2.2
+pandas==2.2.2
+requests==2.31.0
rich-click==1.7.3
shiny==0.8.1
shinyswatch==0.4.2
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index 0d08163..397fac2 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -187,14 +187,19 @@ def create_app(db=None):
ui.input_select(
"search_type",
"Search Type",
- ["STR DB", "CLASTR"],
+ ["STRprofiler Database", "Cellosaurus Database (CLASTR)"],
width="90%"
),
- ui.input_action_button(
- "search",
- "Search",
- class_="btn-success",
- width="45%",
+ ui.tooltip(
+ ui.input_action_button(
+ "search",
+ "Search",
+ class_="btn-success",
+ width="45%",
+ ),
+ "Query STRprofilier Database",
+ id="tt_selected_search",
+ placement="left",
),
ui.input_action_button(
"reset",
@@ -450,6 +455,14 @@ def database_file():
width="100%",
)
+ @reactive.effect
+ @reactive.event(input.search_type)
+ def update_tooltip_msg():
+ if input.search_type() == 'STRprofiler Database':
+ ui.update_tooltip("tt_selected_search", 'Query STRprofilier Database', show=False)
+ if input.search_type() == 'Cellosaurus Database (CLASTR)':
+ ui.update_tooltip("tt_selected_search", 'Query Cellosaurus Database via CLASTR API', show=False)
+
@render.ui
@reactive.event(markers)
def marker_inputs():
@@ -615,7 +628,7 @@ def loaded_example_text():
thinking = ui.notification_show("Message: API Query Running.", duration=None)
# isolate input.search_type to prevent trigger when options change.
with reactive.isolate():
- if input.search_type() == 'STR DB':
+ if input.search_type() == 'STRprofiler Database':
results = _single_query(
query,
str_database(),
@@ -624,7 +637,7 @@ def loaded_example_text():
input.query_filter(),
input.query_filter_threshold(),
)
- elif input.search_type() == 'CLASTR':
+ elif input.search_type() == 'Cellosaurus Database (CLASTR)':
results = clastr_query(
query,
input.query_filter(),
@@ -641,7 +654,7 @@ def out_result():
if output_df() is not None:
# isolate input.search_type to prevent trigger when options change.
with reactive.isolate():
- if input.search_type() == 'STR DB':
+ if input.search_type() == 'STRprofiler Database':
out_df = output_df().copy()
out_df = out_df.style.set_table_attributes(
'class="dataframe shiny-table table w-auto"'
@@ -655,7 +668,7 @@ def out_result():
},
na_rep=""
)
- elif input.search_type() == 'CLASTR':
+ elif input.search_type() == 'Cellosaurus Database (CLASTR)':
out_df = output_df().copy()
print(out_df)
if ('No Clastr Result' in out_df.columns) | ('Error' in out_df.columns):
diff --git a/strprofiler/shiny_app/www/help.html b/strprofiler/shiny_app/www/help.html
index 6c1bdf1..513700f 100644
--- a/strprofiler/shiny_app/www/help.html
+++ b/strprofiler/shiny_app/www/help.html
@@ -1524,12 +1524,20 @@ Default Database
Laboratory PDX program
If this app is hosted with a custom database, please contact the host
for information on the database source.
+
+
+
CLASTR / Cellosaurus API Query
+
Query of the Cellosaurus
+(Bairoch, 2018) cell line database is also available for single samples
+via the CLASTR
+(Robin, Capes-Davis, and Bairoch, 2019) REST
+API.
Single Query Report
For individual samples, a report is generated with the following
-fields.
+fields when ‘STR DB’ is selected as the search type.
@@ -1562,17 +1570,59 @@ Single Query Report
Tanabe Score |
Tanabe similarity score between the query and database
-sample. |
+sample (if Tanabe selected).
Master Query Score |
Master ‘Query’ similarity score between the query and
-database sample. |
+database sample (if Master Query selected).
Master Ref Score |
Master ‘Reference’ similarity score between the query
-and database sample. |
+and database sample (if Master Ref selected).
+
+
+Markers 1 … n |
+Marker alleles with mismatches highlighted. |
+
+
+
+
The report is filtered to include only those samples with greater
+than or equal to the Similarity Score Filter Threshold
+defined by the user, and report only the similarity score selected.
+
When ‘CLASTR’ is selected as the search type, a report is generated
+with the following fields:
+
+
+
+
+
+
+
+
+
+
+Accession |
+Cellosaurus cell line accession ID. Links are provided
+to each accession information page. |
+
+
+Name |
+Cell line name. |
+
+
+Score |
+Similarity score between the query and cell line
+sample. Reported score reflects the selected Similarity Score
+Filter. |
+
+
+Markers 1 … n |
+Marker alleles with mismatches highlighted. |
@@ -1716,14 +1766,21 @@
Batch and File Query Specfic
-
-
Reference
+
+
References
strprofiler
is provided under the MIT license. If you
use this app in your research please cite:
Jared Andrews, Mike Lloyd, & Sam Culley. (2024).
j-andrews7/strprofiler:
v0.2.0. Zenodo.
https://doi.org/10.5281/zenodo.10544686
+
Bairoch A. (2018) The Cellosaurus, a cell line knowledge resource.
+Journal of Biomolecular Techniques. 29:25-38. DOI:
+10.7171/jbt.18-2902-002; PMID: 29805321
+
Robin, T., Capes-Davis, A. & Bairoch, A. (2019) CLASTR: the
+Cellosaurus STR Similarity Search Tool - A Precious Help for Cell Line
+Authentication. International Journal of Cancer. PubMed: 31444973 DOI:
+10.1002/IJC.32639
diff --git a/strprofiler/shiny_app/www/help.md b/strprofiler/shiny_app/www/help.md
index c6b61f1..7aac4c7 100644
--- a/strprofiler/shiny_app/www/help.md
+++ b/strprofiler/shiny_app/www/help.md
@@ -20,21 +20,36 @@ The report will differ depending on if an individual sample or batch of samples
## Default Database
Current data underlying the default database were provided by: [The Jackson Laboratory PDX program](https://tumor.informatics.jax.org/mtbwi/pdxSearch.do)
-If this app is hosted with a custom database, please contact the host for information on the database source.
+If this app is hosted with a custom database, please contact the host for information on the database source.
+
+## CLASTR / Cellosaurus API Query
+Query of the [Cellosaurus](https://www.cellosaurus.org/description.html) (Bairoch, 2018) cell line database is also available for single samples via the [CLASTR](https://www.cellosaurus.org/str-search/) (Robin, Capes-Davis, and Bairoch, 2019) [REST API](https://www.cellosaurus.org/str-search/help.html#5).
---
## Single Query Report
-For individual samples, a report is generated with the following fields.
+For individual samples, a report is generated with the following fields when 'STR DB' is selected as the search type.
| Output Field | Description |
| :--- | :---- |
| Mixed Sample | Flag to indicate sample mixing. Sample mixing is determined by the "'Mixed' Sample Threshold" option. If more markers are tri+ allelic than the threshold, samples are flagged as potentially mixed. |
| Shared Markers | Number of markers shared between the query and database sample. |
| Shared Alleles | Number of alleles shared between the query and database sample. |
-| Tanabe Score | Tanabe similarity score between the query and database sample. |
-| Master Query Score | Master 'Query' similarity score between the query and database sample. |
-| Master Ref Score | Master 'Reference' similarity score between the query and database sample. |
+| Tanabe Score | Tanabe similarity score between the query and database sample (if Tanabe selected). |
+| Master Query Score | Master 'Query' similarity score between the query and database sample (if Master Query selected). |
+| Master Ref Score | Master 'Reference' similarity score between the query and database sample (if Master Ref selected). |
+| Markers 1 ... n | Marker alleles with mismatches highlighted. |
+
+The report is filtered to include only those samples with greater than or equal to the `Similarity Score Filter Threshold` defined by the user, and report only the similarity score selected.
+
+When 'CLASTR' is selected as the search type, a report is generated with the following fields:
+
+| Output Field | Description |
+| :--- | :---- |
+| Accession | Cellosaurus cell line accession ID. Links are provided to each accession information page. |
+| Name | Cell line name. |
+| Score | Similarity score between the query and cell line sample. Reported score reflects the selected Similarity Score Filter. |
+| Markers 1 ... n | Marker alleles with mismatches highlighted. |
The report is filtered to include only those samples with greater than or equal to the `Similarity Score Filter Threshold` defined by the user.
@@ -108,7 +123,11 @@ For batch samples entered in the File Query tab, `STR Similarity` will generate
---
-# Reference
+# References
`strprofiler` is provided under the MIT license. If you use this app in your research please cite:
Jared Andrews, Mike Lloyd, & Sam Culley. (2024).
j-andrews7/strprofiler: v0.2.0. Zenodo.
https://doi.org/10.5281/zenodo.10544686
+
+Bairoch A. (2018) The Cellosaurus, a cell line knowledge resource. Journal of Biomolecular Techniques. 29:25-38. DOI: 10.7171/jbt.18-2902-002; PMID: 29805321
+
+Robin, T., Capes-Davis, A. & Bairoch, A. (2019) CLASTR: the Cellosaurus STR Similarity Search Tool - A Precious Help for Cell Line Authentication. International Journal of Cancer. PubMed: 31444973 DOI: 10.1002/IJC.32639
\ No newline at end of file
From 1cd2ef4b07220af54eaac4f831be246bbc7c2e3a Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Fri, 3 May 2024 08:39:03 -0400
Subject: [PATCH 04/29] add window title
---
strprofiler/shiny_app/shiny_app.py | 1 +
1 file changed, 1 insertion(+)
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index 397fac2..17fcbfd 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -103,6 +103,7 @@ def create_app(db=None):
)
app_ui = ui.page_fluid(
+ ui.panel_title('', "STR Profiler"),
ui.tags.style("#main {padding:12px !important} #sidebar {padding:12px}"),
ui.tags.style(
".h3 {margin-bottom:0.1rem; line-height:1} .card-body {padding-top:6px; padding-bottom:6px}"
From 86453204cefdb0f6962e7073d780f3b3e9aa9cf4 Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 9 May 2024 15:33:28 -0400
Subject: [PATCH 05/29] clastr batch method rough in
---
strprofiler/shiny_app/clastr_api.py | 62 +++++++++++-
strprofiler/shiny_app/shiny_app.py | 142 +++++++++++++++++++---------
2 files changed, 154 insertions(+), 50 deletions(-)
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index 6a7386b..0082298 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -4,7 +4,7 @@
from flatten_json import flatten
-def clastr_query(query, query_filter, include_amelogenin, score_filter):
+def _clastr_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/query/"
dct = {k: [v] for k, v in query.items()}
@@ -65,7 +65,7 @@ def clastr_query(query, query_filter, include_amelogenin, score_filter):
# Marker names are not consistant across results. MarkerName[1] != the same thing in all cases.
# We must track marker name by index by result.
- # The same logic from above applies, split the compount column name string,
+ # The same logic from above applies, split the compound column name string,
# Melt on markerID, and then merge with concat allele made above.
# Finally, pivot into a table and rejoin to higher level results.
marker_names = df.filter(regex='^profiles_0_.*_name').T
@@ -105,6 +105,30 @@ def clastr_query(query, query_filter, include_amelogenin, score_filter):
return query_added
+def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
+ url = "https://www.cellosaurus.org/str-search/api/batch/"
+
+ if query_filter == "Tanabe":
+ query = [dict(item, **{'algorithm': 1}) for item in query]
+ elif query_filter == "Masters Query":
+ query = [dict(item, **{'algorithm': 2}) for item in query]
+ elif query_filter == "Masters Reference":
+ query = [dict(item, **{'algorithm': 2}) for item in query]
+
+ query = [dict(item, **{'includeAmelogenin': include_amelogenin}) for item in query]
+ query = [dict(item, **{'scoreFilter': score_filter}) for item in query]
+ query = [dict(item, **{'outputFormat': 'xlsx'}) for item in query]
+
+ r = requests.post(url, data=json.dumps(query))
+
+ try:
+ r.raise_for_status()
+ except requests.exceptions.HTTPError as e:
+ return pd.DataFrame({"Error": [str(e)]})
+
+ return r
+
+
if __name__ == '__main__':
# url = "https://www.cellosaurus.org/str-search/api/query/%"
# Use above URL for 400 error
@@ -143,10 +167,42 @@ def clastr_query(query, query_filter, include_amelogenin, score_filter):
# "vWA": "16",
# }
- r = clastr_query(data, 'Tanabe', False, 70)
+ r = _clastr_query(data, 'Tanabe', False, 70)
print(r)
+ batch_data = [{
+ "description": "Example 1",
+ "Amelogenin": "X",
+ "CSF1PO": "13,14",
+ "D5S818": "13",
+ "D7S820": "8",
+ "D13S317": "12",
+ "FGA": "24",
+ "TH01": "8",
+ "TPOX": "11",
+ "vWA": "16",
+ }, {
+ "description": "Example 2",
+ "Amelogenin": "X, Y",
+ "CSF1PO": "13",
+ "D5S818": "13, 14",
+ "D7S820": "8, 19",
+ "D13S317": "11, 12",
+ "FGA": "24",
+ "TH01": "8",
+ "TPOX": "11",
+ "vWA": "15",
+ "outputFormat": "xlsx"
+ }]
+
+ r = _clastr_batch_query(batch_data, 'Tanabe', False, 70)
+
+ with open('testing.xlsx', 'wb') as fd:
+ for chunk in r.iter_content(chunk_size=128):
+ fd.write(chunk)
+
+
# JSON data structure:
# {
# "description": "",
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index 17fcbfd..b977253 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -6,7 +6,7 @@
import strprofiler.utils as sp
from strprofiler.shiny_app.calc_functions import _single_query, _batch_query, _file_query
-from strprofiler.shiny_app.clastr_api import clastr_query
+from strprofiler.shiny_app.clastr_api import _clastr_query, _clastr_batch_query
from datetime import date
import time
@@ -272,6 +272,12 @@ def create_app(db=None):
multiple=False,
width="100%",
),
+ ui.input_select(
+ "search_type_batch",
+ "Search Type",
+ ["STRprofiler Database", "Cellosaurus Database (CLASTR)"],
+ width="100%"
+ ),
ui.input_action_button(
"csv_query",
"CSV Query",
@@ -639,7 +645,7 @@ def loaded_example_text():
input.query_filter_threshold(),
)
elif input.search_type() == 'Cellosaurus Database (CLASTR)':
- results = clastr_query(
+ results = _clastr_query(
query,
input.query_filter(),
input.score_amel_query(),
@@ -693,6 +699,7 @@ def out_result():
else:
out_df = pd.DataFrame({"No input provided.": []})
return out_df
+ # TO DO: Remove results table when changing query methods.
# Dealing with downloading results, when requested.
# Note that output_results() is a reactive Calc result.
@@ -718,26 +725,31 @@ def download():
@render.data_frame
def out_batch_df():
output_df.set(batch_query_results())
- try:
- return render.DataTable(output_df())
- except Exception:
- m = ui.modal(
- ui.div(
- {"style": "font-size: 18px"},
- ui.HTML(
- (
- "There was a fatal error in the query.
"
- "Ensure marker names match expectation, and that"
- " no special characters (spaces, etc.) were used in sample names."
- )
- ),
- ),
- title="Batch Query Error",
- easy_close=True,
- footer=None,
- )
- ui.modal_show(m)
- return render.DataTable(pd.DataFrame({"Failed Query. Fix Input File": []}))
+ print(output_df)
+ with reactive.isolate():
+ if input.search_type_batch() == 'STRprofiler Database':
+ try:
+ return render.DataTable(output_df())
+ except Exception:
+ m = ui.modal(
+ ui.div(
+ {"style": "font-size: 18px"},
+ ui.HTML(
+ (
+ "There was a fatal error in the query.
"
+ "Ensure marker names match expectation, and that"
+ " no special characters (spaces, etc.) were used in sample names."
+ )
+ ),
+ ),
+ title="Batch Query Error",
+ easy_close=True,
+ footer=None,
+ )
+ ui.modal_show(m)
+ return render.DataTable(pd.DataFrame({"Failed Query. Fix Input File": []}))
+ elif input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
+ return render.DataTable(pd.DataFrame({"CLASTR Batch Query": ['Download Results']}))
# File input loading
@reactive.calc
@@ -776,39 +788,75 @@ def batch_query_results():
return pd.DataFrame({"Failed Query. Fix Input File": []})
if res_click_file() == 0:
- ui.insert_ui(
- ui.div(
- {"id": "inserted-downloader2"},
- ui.download_button(
- "download2", "Download CSV", width="25%", class_="btn-primary"
+ if input.search_type_batch() == 'STRprofiler Database':
+ ui.insert_ui(
+ ui.div(
+ {"id": "inserted-downloader2"},
+ ui.download_button(
+ "download2", "Download CSV", width="25%", class_="btn-primary"
+ ),
),
- ),
- selector="#res_card_batch",
- where="beforeEnd",
- )
- res_click_file.set(1)
- return _batch_query(
- query_df,
- str_database(),
- input.score_amel_batch(),
- input.mix_threshold_batch(),
- input.tan_threshold_batch(),
- input.mas_q_threshold_batch(),
- input.mas_r_threshold_batch(),
- )
+ selector="#res_card_batch",
+ where="beforeEnd",
+ )
+ res_click_file.set(1)
+ elif input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
+ ui.insert_ui(
+ ui.div(
+ {"id": "inserted-downloader2"},
+ ui.download_button(
+ "download2", "Download XLSX", width="25%", class_="btn-primary"
+ ),
+ ),
+ selector="#res_card_batch",
+ where="beforeEnd",
+ )
+ res_click_file.set(1)
+
+ with reactive.isolate():
+ if input.search_type_batch() == 'STRprofiler Database':
+ results = _batch_query(
+ query_df,
+ str_database(),
+ input.score_amel_batch(),
+ input.mix_threshold_batch(),
+ input.tan_threshold_batch(),
+ input.mas_q_threshold_batch(),
+ input.mas_r_threshold_batch(),
+ )
+ elif input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
+ clastr_query = [(lambda d: d.update(description=key) or d)(val) for (key, val) in query_df.items()]
+ results = _clastr_batch_query(
+ clastr_query,
+ input.query_filter(),
+ input.score_amel_batch(),
+ input.query_filter_threshold()
+ )
+ # TO DO: Change to a batch filter option set.
+ return results
+
+ # File input loading
+ @reactive.effect
+ @reactive.event(input.search_type_batch)
+ def _():
+ ui.remove_ui("#inserted-downloader2")
+ res_click_file.set(0)
+ # TO DO: Remove batch results table when changing methods.
# Dealing with dowloading results, when requested.
# Note that batch_query_results() is a reactive Calc result.
@render.download(
- filename="STR_Batch_Results_"
- + date.today().isoformat()
- + "_"
- + time.strftime("%Hh-%Mm", time.localtime())
- + ".csv"
+ filename=lambda: "STR_Batch_Results_" + date.today().isoformat() + "_" + time.strftime("%Hh-%Mm", time.localtime()) + ".csv"
+ if f"{input.search_type_batch()}" == 'STRprofiler Database'
+ else "STR_Batch_Results_" + date.today().isoformat() + "_" + time.strftime("%Hh-%Mm", time.localtime()) + ".xlsx"
)
def download2():
if batch_query_results() is not None:
- yield batch_query_results().to_csv(index=False)
+ if input.search_type_batch() == 'STRprofiler Database':
+ yield batch_query_results().to_csv(index=False)
+ if input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
+ for chunk in batch_query_results().iter_content(chunk_size=128):
+ yield chunk
# Dealing with passing example file to user.
@render.download()
From 1bd91a99be750effb4dc609d3bd1d5df26ddeac6 Mon Sep 17 00:00:00 2001
From: Jared Andrews
Date: Tue, 14 May 2024 12:32:45 -0500
Subject: [PATCH 06/29] add requirements, bump version
---
.gitignore | 1 +
CHANGELOG.md | 7 +++++++
docs/requirements.txt | 4 +++-
pyproject.toml | 4 +++-
requirements.txt | 3 ++-
5 files changed, 16 insertions(+), 3 deletions(-)
diff --git a/.gitignore b/.gitignore
index bad588f..719d172 100644
--- a/.gitignore
+++ b/.gitignore
@@ -25,6 +25,7 @@ share/python-wheels/
.installed.cfg
*.egg
MANIFEST
+.conda/*
# PyInstaller
# Usually these files are written by a python script from a template
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 0ea17a6..ef1f28f 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -1,5 +1,12 @@
# Changelog
+## v0.3.0
+
+**Release date:**
+
+ - Added ability to query the CLASTR API for single or batch queries from within the STRprofiler
+ app - [#24](https://github.com/j-andrews7/strprofiler/pull/24).
+
## v0.2.0
**Release date: 04/16/2024**
diff --git a/docs/requirements.txt b/docs/requirements.txt
index 367585e..c262090 100644
--- a/docs/requirements.txt
+++ b/docs/requirements.txt
@@ -4,4 +4,6 @@ myst-parser
rich-click
shiny
shinyswatch
-faicons
\ No newline at end of file
+faicons
+requests
+flatten-json
\ No newline at end of file
diff --git a/pyproject.toml b/pyproject.toml
index f83e082..834af42 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
[tool.poetry]
name = "strprofiler"
-version = "0.2.0"
+version = "0.3.0"
description = "A simple python utility to compare short tandem repeat (STR) profiles."
authors = ["Jared Andrews ",
"Mike Lloyd "]
@@ -18,6 +18,8 @@ shiny = "^0.8.0"
shinyswatch = "^0.4.2"
Jinja2 = "^3.1.3"
faicons = "^0.2.2"
+requests = "^2.31.0"
+flatten-json = "^0.1.14"
[tool.poetry.dev-dependencies]
diff --git a/requirements.txt b/requirements.txt
index 9ebff4b..daba595 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -8,4 +8,5 @@ requests==2.31.0
rich-click==1.7.3
shiny==0.8.1
shinyswatch==0.4.2
-Jinja2==3.1.2
\ No newline at end of file
+Jinja2==3.1.2
+requests==2.31.0
\ No newline at end of file
From 579a1cf82538d398a12a7ccd0f5c160e277773c1 Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 16 May 2024 09:16:23 -0400
Subject: [PATCH 07/29] fix for #26
---
.gitignore | 3 +-
strprofiler/shiny_app/clastr_api.py | 44 ++++++++++++++++++++++++++---
strprofiler/shiny_app/shiny_app.py | 1 -
3 files changed, 42 insertions(+), 6 deletions(-)
diff --git a/.gitignore b/.gitignore
index 719d172..8599a3a 100644
--- a/.gitignore
+++ b/.gitignore
@@ -153,4 +153,5 @@ cython_debug/
#.idea/
.DS_Store
-strprofiler.json
\ No newline at end of file
+strprofiler.json
+testing.xlsx
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index 0082298..60ade3d 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -18,6 +18,16 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
elif query_filter == "Masters Reference":
query['algorithm'] = 3
+ if "PentaD" in query.keys():
+ query["Penta D"] = query.pop("PentaD")
+ elif "Penta_D" in query.keys():
+ query["Penta D"] = query.pop("Penta_D")
+
+ if "PentaE" in query.keys():
+ query["Penta E"] = query.pop("PentaE")
+ elif "Penta_E" in query.keys():
+ query["Penta E"] = query.pop("Penta_E")
+
query['includeAmelogenin'] = include_amelogenin
query['scoreFilter'] = score_filter
@@ -87,6 +97,11 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
merged['accession_link'] = "https://web.expasy.org/cellosaurus/" + merged['accession']
+ if "Penta D" in merged.keys():
+ merged["PentaD"] = merged.pop("Penta D")
+ if "Penta E" in merged.keys():
+ merged["PentaE"] = merged.pop("Penta E")
+
# add the query line to the top of merged, and reorder columns
query_added = pd.concat([query_df, merged]).reset_index(drop=True)
@@ -147,8 +162,8 @@ def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
"D19S433": "14",
"D21S11": "31,31.2",
"FGA": "23",
- "Penta D": "",
- "Penta E": "",
+ "PentaD": "",
+ "PentaE": "",
"TH01": "7,9.3",
"TPOX": "8",
"vWA": "18",
@@ -159,12 +174,33 @@ def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
# "Amelogenin": "X",
# "CSF1PO": "13,14",
# "D5S818": "13",
- # "D7S820": "8",
+ # "D7S820": "8,9",
# "D13S317": "12",
# "FGA": "24",
# "TH01": "8",
# "TPOX": "11",
- # "vWA": "16",
+ # "vWA": "16"
+ # }
+
+ # # stock example from https://www.cellosaurus.org/str-search/
+ # data = {"Amelogenin": "X",
+ # "CSF1PO": "11,12",
+ # "D2S1338": "19,23",
+ # "D3S1358": "15,17",
+ # "D5S818": "11,12",
+ # "D7S820": "10",
+ # "D8S1179": "10",
+ # "D13S317": "11,12",
+ # "D16S539": "11,12",
+ # "D18S51": "13",
+ # "D19S433": "14",
+ # "D21S11": "29,30",
+ # "FGA": "20,22",
+ # "PentaD": "11,14",
+ # "PentaE": "14,16",
+ # "TH01": "6,9",
+ # "TPOX": "8,9",
+ # "vWA": "17,19"
# }
r = _clastr_query(data, 'Tanabe', False, 70)
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index b977253..ff1c2c5 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -677,7 +677,6 @@ def out_result():
)
elif input.search_type() == 'Cellosaurus Database (CLASTR)':
out_df = output_df().copy()
- print(out_df)
if ('No Clastr Result' in out_df.columns) | ('Error' in out_df.columns):
return out_df
try:
From 77529be3f0844788a68b5eec75cec79557038fe2 Mon Sep 17 00:00:00 2001
From: Jared Andrews
Date: Thu, 16 May 2024 10:02:43 -0500
Subject: [PATCH 08/29] additional tweaks for #26
---
strprofiler/shiny_app/clastr_api.py | 21 +++++----------
strprofiler/utils.py | 41 ++++++++++++++++++++++-------
2 files changed, 37 insertions(+), 25 deletions(-)
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index 60ade3d..16f1c26 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -2,7 +2,7 @@
import json
import pandas as pd
from flatten_json import flatten
-
+from strprofiler.utils import _pentafix
def _clastr_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/query/"
@@ -17,16 +17,8 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
query['algorithm'] = 2
elif query_filter == "Masters Reference":
query['algorithm'] = 3
-
- if "PentaD" in query.keys():
- query["Penta D"] = query.pop("PentaD")
- elif "Penta_D" in query.keys():
- query["Penta D"] = query.pop("Penta_D")
-
- if "PentaE" in query.keys():
- query["Penta E"] = query.pop("PentaE")
- elif "Penta_E" in query.keys():
- query["Penta E"] = query.pop("Penta_E")
+
+ query = _pentafix(query, reverse = True)
query['includeAmelogenin'] = include_amelogenin
query['scoreFilter'] = score_filter
@@ -97,10 +89,7 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
merged['accession_link'] = "https://web.expasy.org/cellosaurus/" + merged['accession']
- if "Penta D" in merged.keys():
- merged["PentaD"] = merged.pop("Penta D")
- if "Penta E" in merged.keys():
- merged["PentaE"] = merged.pop("Penta E")
+ merged = _pentafix(merged)
# add the query line to the top of merged, and reorder columns
@@ -123,6 +112,8 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/batch/"
+ query = [_pentafix(item, reverse = True) for item in query]
+
if query_filter == "Tanabe":
query = [dict(item, **{'algorithm': 1}) for item in query]
elif query_filter == "Masters Query":
diff --git a/strprofiler/utils.py b/strprofiler/utils.py
index 987128f..d3e533d 100644
--- a/strprofiler/utils.py
+++ b/strprofiler/utils.py
@@ -35,17 +35,38 @@ def _clean_element(x):
return ",".join(sorted_elements)
-def _pentafix(samps_dict):
+def _pentafix(samps_dict, reverse = False):
"""Takes a dictionary of alleles and returns a dictionary with common Penta markers renamed for consistency."""
- if "Penta D" in samps_dict.keys():
- samps_dict["PentaD"] = samps_dict.pop("Penta D")
- elif "Penta_D" in samps_dict.keys():
- samps_dict["PentaD"] = samps_dict.pop("Penta_D")
-
- if "Penta E" in samps_dict.keys():
- samps_dict["PentaE"] = samps_dict.pop("Penta E")
- elif "Penta_E" in samps_dict.keys():
- samps_dict["PentaE"] = samps_dict.pop("Penta_E")
+ if not reverse:
+ if "Penta C" in samps_dict.keys():
+ samps_dict["PentaC"] = samps_dict.pop("Penta C")
+ elif "Penta_C" in samps_dict.keys():
+ samps_dict["PentaC"] = samps_dict.pop("Penta_C")
+
+ if "Penta D" in samps_dict.keys():
+ samps_dict["PentaD"] = samps_dict.pop("Penta D")
+ elif "Penta_D" in samps_dict.keys():
+ samps_dict["PentaD"] = samps_dict.pop("Penta_D")
+
+ if "Penta E" in samps_dict.keys():
+ samps_dict["PentaE"] = samps_dict.pop("Penta E")
+ elif "Penta_E" in samps_dict.keys():
+ samps_dict["PentaE"] = samps_dict.pop("Penta_E")
+ else:
+ if "PentaC" in samps_dict.keys():
+ samps_dict["Penta C"] = samps_dict.pop("PentaC")
+ elif "Penta_C" in samps_dict.keys():
+ samps_dict["Penta C"] = samps_dict.pop("Penta_C")
+
+ if "PentaD" in samps_dict.keys():
+ samps_dict["Penta D"] = samps_dict.pop("PentaD")
+ elif "Penta_D" in samps_dict.keys():
+ samps_dict["Penta D"] = samps_dict.pop("Penta_D")
+
+ if "PentaE" in samps_dict.keys():
+ samps_dict["Penta E"] = samps_dict.pop("PentaE")
+ elif "Penta_E" in samps_dict.keys():
+ samps_dict["Penta E"] = samps_dict.pop("Penta_E")
return samps_dict
From 771c133d9ac628ff546a5071a9dc1b4293949d35 Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 16 May 2024 11:26:25 -0400
Subject: [PATCH 09/29] add marker check for single query
---
strprofiler/shiny_app/clastr_api.py | 58 +++++++++++++++++++++++++++--
strprofiler/shiny_app/shiny_app.py | 19 +++++++++-
2 files changed, 73 insertions(+), 4 deletions(-)
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index 16f1c26..e3c5157 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -4,6 +4,53 @@
from flatten_json import flatten
from strprofiler.utils import _pentafix
+
+def _valid_marker_check(markers):
+
+ valid_api_markers = ['Amelogenin',
+ 'CSF1PO',
+ 'D2S1338',
+ 'D3S1358',
+ 'D5S818',
+ 'D7S820',
+ 'D8S1179',
+ 'D13S317',
+ 'D16S539',
+ 'D18S51',
+ 'D19S433',
+ 'D21S11',
+ 'FGA',
+ 'Penta D',
+ 'Penta E',
+ 'PentaD',
+ 'PentaE',
+ 'TH01',
+ 'TPOX',
+ 'vWA',
+ 'D1S1656',
+ 'D2S441',
+ 'D6S1043',
+ 'D10S1248',
+ 'D12S391',
+ 'D22S1045',
+ 'DXS101',
+ 'DYS391',
+ 'F13A01',
+ 'F13B',
+ 'FESFPS',
+ 'LPL',
+ 'Penta C',
+ 'PentaC',
+ 'SE33']
+
+ # remove extra fields, if present as keys may come from _clastr_query or other.
+ query_markers = [marker for marker in markers if marker not in ['algorithm', 'includeAmelogenin', 'scoreFilter']]
+
+ missing_markers = list(set(query_markers) - set(valid_api_markers))
+
+ return missing_markers
+
+
def _clastr_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/query/"
@@ -17,8 +64,8 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
query['algorithm'] = 2
elif query_filter == "Masters Reference":
query['algorithm'] = 3
-
- query = _pentafix(query, reverse = True)
+
+ query = _pentafix(query, reverse=True)
query['includeAmelogenin'] = include_amelogenin
query['scoreFilter'] = score_filter
@@ -112,7 +159,7 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
url = "https://www.cellosaurus.org/str-search/api/batch/"
- query = [_pentafix(item, reverse = True) for item in query]
+ query = [_pentafix(item, reverse=True) for item in query]
if query_filter == "Tanabe":
query = [dict(item, **{'algorithm': 1}) for item in query]
@@ -158,6 +205,7 @@ def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
"TH01": "7,9.3",
"TPOX": "8",
"vWA": "18",
+ "NoGoodVeryBad": "I'm not a valid marker. However, that is ok. We catch this now."
}
# # stock from https://www.cellosaurus.org/str-search/help.html#5.1
@@ -194,6 +242,10 @@ def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
# "vWA": "17,19"
# }
+ malformed_markers = _valid_marker_check(data.keys())
+
+ print(malformed_markers)
+
r = _clastr_query(data, 'Tanabe', False, 70)
print(r)
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index ff1c2c5..eae29d5 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -6,7 +6,7 @@
import strprofiler.utils as sp
from strprofiler.shiny_app.calc_functions import _single_query, _batch_query, _file_query
-from strprofiler.shiny_app.clastr_api import _clastr_query, _clastr_batch_query
+from strprofiler.shiny_app.clastr_api import _valid_marker_check, _clastr_query, _clastr_batch_query
from datetime import date
import time
@@ -645,6 +645,23 @@ def loaded_example_text():
input.query_filter_threshold(),
)
elif input.search_type() == 'Cellosaurus Database (CLASTR)':
+ malformed_markers = _valid_marker_check(query.keys())
+ if malformed_markers:
+ notify_m = ui.modal(
+ "Markers: {} are incompatible with the CLASTR query."
+ .format(str(malformed_markers)[1:-1]),
+ ui.tags.br(),
+ ui.tags.br(),
+ "These markers will not be used in the query.",
+ ui.tags.br(),
+ ui.tags.br(),
+ "See: ", ui.tags.a('CLASTR', href=str("https://www.cellosaurus.org/str-search/"), target="_blank"),
+ " for a complete list of compatible marker names",
+ title="Inompatible CLASTR Markers",
+ easy_close=True,
+ footer=ui.modal_button('Understood')
+ )
+ ui.modal_show(notify_m)
results = _clastr_query(
query,
input.query_filter(),
From 815036f51066e9e8095d48de3391a518eb68adc8 Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Thu, 16 May 2024 19:26:53 -0400
Subject: [PATCH 10/29] conditional batch options. modal notice for malformed
markers.
---
strprofiler/shiny_app/clastr_api.py | 4 +-
strprofiler/shiny_app/shiny_app.py | 126 +++++++++++++++++-----------
2 files changed, 80 insertions(+), 50 deletions(-)
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index e3c5157..fd0e9e9 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -44,7 +44,7 @@ def _valid_marker_check(markers):
'SE33']
# remove extra fields, if present as keys may come from _clastr_query or other.
- query_markers = [marker for marker in markers if marker not in ['algorithm', 'includeAmelogenin', 'scoreFilter']]
+ query_markers = [marker for marker in markers if marker not in ['algorithm', 'includeAmelogenin', 'scoreFilter', 'description']]
missing_markers = list(set(query_markers) - set(valid_api_markers))
@@ -143,8 +143,6 @@ def _clastr_query(query, query_filter, include_amelogenin, score_filter):
query_added = pd.concat([query_df, merged]).reset_index(drop=True)
query_added["bestScore"] = query_added['bestScore'].map("{0:.2f}".format).replace("nan", "")
- # print(query_added.columns)
-
if 'problem' in query_added.columns:
query_added = query_added[['accession', 'name', 'species', 'bestScore', 'accession_link', 'problem'] +
[c for c in query_added if c not in
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index eae29d5..10892d9 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -76,6 +76,25 @@ def _link_wrap(name, link, problem):
return ui.tags.a(name, href=str(link), target="_blank")
+def notify_modal(marker_list):
+ ui.modal_show(
+ ui.modal(
+ "Marker(s): {} are incompatible with the CLASTR query."
+ .format(str(marker_list)[1:-1]),
+ ui.tags.br(),
+ ui.tags.br(),
+ "The marker(s) will not be used in the query.",
+ ui.tags.br(),
+ ui.tags.br(),
+ "See: ", ui.tags.a('CLASTR', href=str("https://www.cellosaurus.org/str-search/"), target="_blank"),
+ " for a complete list of compatible marker names",
+            title="Incompatible CLASTR Markers",
+ easy_close=True,
+ footer=ui.modal_button('Understood')
+ )
+ )
+
+
# App Generation ###
def create_app(db=None):
@@ -236,33 +255,61 @@ def create_app(db=None):
{"id": "batch_sidebar"},
ui.tags.h3("Options"),
ui.tags.hr(),
+ ui.input_select(
+ "search_type_batch",
+ "Search Type",
+ ["STRprofiler Database", "Cellosaurus Database (CLASTR)"],
+ width="100%"
+ ),
ui.card(
ui.input_switch(
"score_amel_batch", "Score Amelogenin", value=False
),
- ui.input_numeric(
- "mix_threshold_batch",
- "'Mixed' Sample Threshold",
- value=3,
- width="100%",
- ),
- ui.input_numeric(
- "tan_threshold_batch",
- "Tanabe Filter Threshold",
- value=80,
- width="100%",
- ),
- ui.input_numeric(
- "mas_q_threshold_batch",
- "Masters (vs. query) Filter Threshold",
- value=80,
- width="100%",
+ ui.panel_conditional(
+ "input.search_type_batch === 'STRprofiler Database'",
+ ui.input_numeric(
+ "mix_threshold_batch",
+ "'Mixed' Sample Threshold",
+ value=3,
+ width="100%",
+ ),
+ ui.input_numeric(
+ "tan_threshold_batch",
+ "Tanabe Filter Threshold",
+ value=80,
+ width="100%",
+ ),
+ ui.input_numeric(
+ "mas_q_threshold_batch",
+ "Masters (vs. query) Filter Threshold",
+ value=80,
+ width="100%",
+ ),
+ ui.input_numeric(
+ "mas_r_threshold_batch",
+ "Masters (vs. reference) Filter Threshold",
+ value=80,
+ width="100%",
+ ),
),
- ui.input_numeric(
- "mas_r_threshold_batch",
- "Masters (vs. reference) Filter Threshold",
- value=80,
- width="100%",
+ ui.panel_conditional(
+ "input.search_type_batch === 'Cellosaurus Database (CLASTR)'",
+ ui.input_select(
+ "batch_query_filter",
+ "Similarity Score Filter",
+ choices=[
+ "Tanabe",
+ "Masters Query",
+ "Masters Reference",
+ ],
+ width="100%",
+ ),
+ ui.input_numeric(
+ "batch_query_filter_threshold",
+ "Similarity Score Filter Threshold",
+ value=80,
+ width="100%",
+ ),
),
),
ui.input_file(
@@ -272,12 +319,6 @@ def create_app(db=None):
multiple=False,
width="100%",
),
- ui.input_select(
- "search_type_batch",
- "Search Type",
- ["STRprofiler Database", "Cellosaurus Database (CLASTR)"],
- width="100%"
- ),
ui.input_action_button(
"csv_query",
"CSV Query",
@@ -645,23 +686,11 @@ def loaded_example_text():
input.query_filter_threshold(),
)
elif input.search_type() == 'Cellosaurus Database (CLASTR)':
+
malformed_markers = _valid_marker_check(query.keys())
if malformed_markers:
- notify_m = ui.modal(
- "Markers: {} are incompatible with the CLASTR query."
- .format(str(malformed_markers)[1:-1]),
- ui.tags.br(),
- ui.tags.br(),
- "These markers will not be used in the query.",
- ui.tags.br(),
- ui.tags.br(),
- "See: ", ui.tags.a('CLASTR', href=str("https://www.cellosaurus.org/str-search/"), target="_blank"),
- " for a complete list of compatible marker names",
- title="Inompatible CLASTR Markers",
- easy_close=True,
- footer=ui.modal_button('Understood')
- )
- ui.modal_show(notify_m)
+ notify_modal(malformed_markers)
+
results = _clastr_query(
query,
input.query_filter(),
@@ -741,7 +770,6 @@ def download():
@render.data_frame
def out_batch_df():
output_df.set(batch_query_results())
- print(output_df)
with reactive.isolate():
if input.search_type_batch() == 'STRprofiler Database':
try:
@@ -842,13 +870,17 @@ def batch_query_results():
)
elif input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
clastr_query = [(lambda d: d.update(description=key) or d)(val) for (key, val) in query_df.items()]
+
+ malformed_markers = _valid_marker_check(query_df[next(iter(query_df))].keys())
+ if malformed_markers:
+ notify_modal(malformed_markers)
+
results = _clastr_batch_query(
clastr_query,
- input.query_filter(),
+ input.batch_query_filter(),
input.score_amel_batch(),
- input.query_filter_threshold()
+ input.batch_query_filter_threshold()
)
- # TO DO: Change to a batch filter option set.
return results
# File input loading
From 3d5d412c49ed17cd6dd24a5676a0550796f7754c Mon Sep 17 00:00:00 2001
From: MikeWLloyd
Date: Mon, 20 May 2024 15:27:02 -0400
Subject: [PATCH 11/29] global clastr function
---
pyproject.toml | 3 +-
strprofiler/clastr.py | 237 ++++++++++++++++++++++++++++
strprofiler/shiny_app/clastr_api.py | 50 +-----
strprofiler/shiny_app/shiny_app.py | 28 ++--
strprofiler/utils.py | 54 ++++++-
tests/Example_clastr_input.csv | 4 +
6 files changed, 312 insertions(+), 64 deletions(-)
create mode 100644 strprofiler/clastr.py
create mode 100644 tests/Example_clastr_input.csv
diff --git a/pyproject.toml b/pyproject.toml
index 834af42..1c596cd 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -14,7 +14,7 @@ pandas = "^2.2"
rich-click = "^1.5.2"
numpy = "^1.26.3"
openpyxl = "^3.0.10"
-shiny = "^0.8.0"
+shiny = "^0.9.0"
shinyswatch = "^0.4.2"
Jinja2 = "^3.1.3"
faicons = "^0.2.2"
@@ -25,6 +25,7 @@ flatten-json = "^0.1.14"
[tool.poetry.scripts]
strprofiler = 'strprofiler.strprofiler:strprofiler'
+clastr = 'strprofiler.clastr:clastr_batch_post_request'
strprofiler-app = 'strprofiler.strprofiler:local_shiny_app'
[build-system]
diff --git a/strprofiler/clastr.py b/strprofiler/clastr.py
new file mode 100644
index 0000000..6365d2f
--- /dev/null
+++ b/strprofiler/clastr.py
@@ -0,0 +1,237 @@
+import rich_click as click
+from pathlib import Path
+from datetime import datetime
+import sys
+import pandas as pd
+import requests
+import json
+import strprofiler.utils as utils
+
+
+@click.command()
+@click.option(
+ "-sa",
+ "--search_algorithm",
+ default=1,
+ help="""Search algorithm to use in the Clastr query.
+ 1 - Tanabe, 2 - Masters (vs. query); 3 - Masters (vs. reference)""",
+ show_default=True,
+ type=int,
+)
+@click.option(
+ "-sm",
+ "--scoring_mode",
+ default=1,
+ help="""Search mode to account for missing alleles in query or reference.
+ 1 - Non-empty markers, 2 - Query markers, 3 - Reference markers.""",
+ show_default=True,
+ type=int,
+)
+@click.option(
+ "-sf",
+ "--score_filter",
+ default=80,
+ help="Minimum score to report as potential matches in summary table.",
+ show_default=True,
+ type=int,
+)
+@click.option(
+ "-mr",
+ "--max_results",
+ default=200,
+ help="Filter defining the maximum number of results to be returned.",
+ show_default=True,
+ type=int,
+)
+@click.option(
+ "-mm",
+ "--min_markers",
+ default=8,
+ help="Filter defining the minimum number of markers for matches to be reported.",
+ show_default=True,
+ type=int,
+)
+@click.option(
+    "-smap",
+ "--sample_map",
+ help="""Path to sample map in csv format for renaming.
+ First column should be sample names as given in STR file(s),
+ second should be new names to assign. No header.""",
+ type=click.Path(),
+)
+@click.option(
+ "-scol",
+ "--sample_col",
+ help="Name of sample column in STR file(s).",
+ default="Sample",
+ show_default=True,
+ type=str,
+)
+@click.option(
+ "-mcol",
+ "--marker_col",
+ help="""Name of marker column in STR file(s).
+ Only used if format is 'wide'.""",
+ default="Marker",
+ show_default=True,
+ type=str,
+)
+@click.option(
+ "-pfix",
+ "--penta_fix",
+ help="""Whether to try to harmonize PentaE/D allele spelling.""",
+ default=True,
+ show_default=True,
+ type=bool,
+)
+@click.option(
+ "-amel",
+ "--score_amel",
+ help="""Use Amelogenin for similarity scoring.""",
+ default=False,
+ show_default=True,
+ type=bool,
+)
+@click.option(
+ "-o",
+ "--output_dir",
+ default="./STRprofiler",
+ help="Path to the output directory.",
+ show_default=True,
+ type=click.Path(),
+)
+@click.argument("input_files", required=True, type=click.Path(exists=True), nargs=-1)
+@click.version_option()
+def clastr_batch_post_request(
+ input_files,
+ sample_map=None,
+ output_dir="./STRprofiler",
+ search_algorithm=1,
+ scoring_mode=1,
+ score_filter=80,
+ max_results=200,
+ min_markers=8,
+ sample_col="Sample Name",
+ marker_col="Marker",
+ penta_fix=True,
+ score_amel=False,
+):
+    """CLASTR_Query compares STR profiles to the human Cellosaurus knowledge base using the CLASTR REST API.
+
+ :param input_files: List of input STR files in csv, xlsx, tsv, or txt format.
+ :type input_files: click.Path
+
+ :param sample_map: Path to sample map in csv format for renaming.
+ First column should be sample names as given in STR file(s),
+ second should be new names to assign. No header., defaults to None
+ :type sample_map: str, optional
+
+ :param output_dir: Path to output directory, defaults to "./STRprofiler"
+ :type output_dir: str, optional
+
+ :param search_algorithm: Search algorithm to use in the Clastr query, Options: 1 - Tanabe, 2 - Masters (vs. query); 3 - Masters (vs. reference)
+ defaults to 1 (tanabe).
+ :type search_algorithm: int
+
+    :param scoring_mode: Search mode to account for missing alleles in query or reference.
+        Options: 1 - Non-empty markers, 2 - Query markers, 3 - Reference markers.
+        defaults to 1 (Non-empty markers).
+    :type scoring_mode: int
+
+ :param score_filter: Minimum score to report as potential matches in summary table, defaults to 80
+ :type score_filter: int, optional
+
+ :param max_results: Filter defining the maximum number of results to be returned.
+ Note that in the case of conflicted cell lines, the Best and Worst versions are processed as pairs and only the best
+ score is affected by the threshold. Consequently, some Worst cases with a score below the threshold can still be present in the results.
+ defaults to 200
+    :type max_results: int, optional
+
+ :param min_markers: Filter defining the minimum number of markers for matches to be reported, defaults to 8.
+    :type min_markers: int, optional
+
+ :param sample_col: Name of sample column in STR file(s), defaults to "Sample Name"
+ :type sample_col: str, optional
+
+ :param marker_col: Name of marker column in STR file(s).
+ Only used if format is 'wide', defaults to "Marker"
+ :type marker_col: str, optional
+
+ :param penta_fix: Whether to try to harmonize PentaE/D allele spelling, defaults to True
+ :type penta_fix: bool, optional
+
+ :param score_amel: Use Amelogenin for similarity scoring, defaults to False
+ :type score_amel: bool, optional
+ """
+
+ # Make output directory and open file for logging.
+ Path(output_dir).mkdir(parents=True, exist_ok=True)
+ now = datetime.now()
+ dt_string = now.strftime("%Y%m%d.%H_%M_%S")
+ log_file = open(Path(output_dir, "strprofiler.clastrQuery." + dt_string + ".log"), "w")
+
+ print("Search algorithm: " + str(search_algorithm), file=log_file)
+ print("Scoring mode: " + str(scoring_mode), file=log_file)
+    print("Score filter: " + str(score_filter), file=log_file)
+ print("Max results: " + str(max_results), file=log_file)
+ print("Min markers: " + str(min_markers), file=log_file)
+ print("Sample map: " + str(sample_map), file=log_file)
+ print("Sample column: " + str(sample_col), file=log_file)
+ print("Marker column: " + str(marker_col), file=log_file)
+ print("Penta fix: " + str(penta_fix), file=log_file)
+ print("Use amelogenin for scoring: " + str(score_amel) + "\n", file=log_file)
+ print("Full command:", file=log_file)
+
+ print(" ".join(sys.argv) + "\n", file=log_file)
+
+ # Check for sample map.
+ if sample_map is not None:
+ sample_map = pd.read_csv(sample_map, header=None, encoding="unicode_escape")
+
+ # Data ingress.
+ query = utils.str_ingress(
+ paths=input_files,
+ sample_col=sample_col,
+ marker_col=marker_col,
+ sample_map=sample_map,
+ penta_fix=penta_fix,
+ ).to_dict(orient="index")
+
+ clastr_query = [(lambda d: d.update(description=key) or d)(val) for (key, val) in query.items()]
+
+ malformed_markers = utils.validate_api_markers(next(iter(clastr_query)).keys())
+ if malformed_markers:
+ print("Marker(s): {} are incompatible with the CLASTR query. The marker(s) will not be used in the query."
+ .format(str(malformed_markers)[1:-1]), file=log_file)
+ print("See: https://www.cellosaurus.org/str-search/ for a complete list of compatible marker names", file=log_file)
+
+ url = "https://www.cellosaurus.org/str-search/api/batch/"
+
+ clastr_query = [utils._pentafix(item, reverse=True) for item in clastr_query]
+ clastr_query = [dict(item, **{'algorithm': search_algorithm}) for item in clastr_query]
+ clastr_query = [dict(item, **{'scoringMode': scoring_mode}) for item in clastr_query]
+ clastr_query = [dict(item, **{'scoreFilter': score_filter}) for item in clastr_query]
+ clastr_query = [dict(item, **{'includeAmelogenin': score_amel}) for item in clastr_query]
+ clastr_query = [dict(item, **{'minMarkers': min_markers}) for item in clastr_query]
+ clastr_query = [dict(item, **{'maxResults': max_results}) for item in clastr_query]
+ clastr_query = [dict(item, **{'outputFormat': 'xlsx'}) for item in clastr_query]
+
+ print("Querying CLASTR API at: ", url, file=log_file)
+ r = requests.post(url, data=json.dumps(clastr_query))
+
+ try:
+ r.raise_for_status()
+ except requests.exceptions.HTTPError as e:
+ print("Request failed with error: '", e, "'", file=log_file)
+ print("Request failed with error: '", e, "'")
+ return ''
+
+ print("Response from query: ", r.status_code, file=log_file)
+
+ with open(Path(output_dir, "strprofiler.clastrQueryResult." + dt_string + ".xlsx"), "wb") as fd:
+ for chunk in r.iter_content(chunk_size=128):
+ fd.write(chunk)
+
+ print("Results saved: ", Path(output_dir, "strprofiler.clastrQueryResult." + dt_string + ".xlsx"), file=log_file)
+
+ log_file.close()
diff --git a/strprofiler/shiny_app/clastr_api.py b/strprofiler/shiny_app/clastr_api.py
index fd0e9e9..33047b2 100644
--- a/strprofiler/shiny_app/clastr_api.py
+++ b/strprofiler/shiny_app/clastr_api.py
@@ -2,53 +2,7 @@
import json
import pandas as pd
from flatten_json import flatten
-from strprofiler.utils import _pentafix
-
-
-def _valid_marker_check(markers):
-
- valid_api_markers = ['Amelogenin',
- 'CSF1PO',
- 'D2S1338',
- 'D3S1358',
- 'D5S818',
- 'D7S820',
- 'D8S1179',
- 'D13S317',
- 'D16S539',
- 'D18S51',
- 'D19S433',
- 'D21S11',
- 'FGA',
- 'Penta D',
- 'Penta E',
- 'PentaD',
- 'PentaE',
- 'TH01',
- 'TPOX',
- 'vWA',
- 'D1S1656',
- 'D2S441',
- 'D6S1043',
- 'D10S1248',
- 'D12S391',
- 'D22S1045',
- 'DXS101',
- 'DYS391',
- 'F13A01',
- 'F13B',
- 'FESFPS',
- 'LPL',
- 'Penta C',
- 'PentaC',
- 'SE33']
-
- # remove extra fields, if present as keys may come from _clastr_query or other.
- query_markers = [marker for marker in markers if marker not in ['algorithm', 'includeAmelogenin', 'scoreFilter', 'description']]
-
- missing_markers = list(set(query_markers) - set(valid_api_markers))
-
- return missing_markers
+from strprofiler.utils import _pentafix, validate_api_markers
def _clastr_query(query, query_filter, include_amelogenin, score_filter):
@@ -240,7 +194,7 @@ def _clastr_batch_query(query, query_filter, include_amelogenin, score_filter):
# "vWA": "17,19"
# }
- malformed_markers = _valid_marker_check(data.keys())
+ malformed_markers = validate_api_markers(data.keys())
print(malformed_markers)
diff --git a/strprofiler/shiny_app/shiny_app.py b/strprofiler/shiny_app/shiny_app.py
index 10892d9..3d5c145 100644
--- a/strprofiler/shiny_app/shiny_app.py
+++ b/strprofiler/shiny_app/shiny_app.py
@@ -4,9 +4,9 @@
import pandas as pd
from faicons import icon_svg
-import strprofiler.utils as sp
+import strprofiler.utils as utils
from strprofiler.shiny_app.calc_functions import _single_query, _batch_query, _file_query
-from strprofiler.shiny_app.clastr_api import _valid_marker_check, _clastr_query, _clastr_batch_query
+from strprofiler.shiny_app.clastr_api import _clastr_query, _clastr_batch_query
from datetime import date
import time
@@ -27,7 +27,7 @@ def database_load(file):
Exception: If the file fails to load or if sample ID names are duplicated.
"""
try:
- str_database = sp.str_ingress(
+ str_database = utils.str_ingress(
[file], # expects list
sample_col="Sample",
marker_col="Marker",
@@ -211,7 +211,7 @@ def create_app(db=None):
width="90%"
),
ui.tooltip(
- ui.input_action_button(
+ ui.input_task_button(
"search",
"Search",
class_="btn-success",
@@ -238,6 +238,7 @@ def create_app(db=None):
ui.column(3, ui.tags.h3("Results")),
ui.column(1, ui.p("")),
),
+ # TO DO: Try loading/thinking spinners.
ui.column(
12,
{"id": "res_card"},
@@ -319,7 +320,7 @@ def create_app(db=None):
multiple=False,
width="100%",
),
- ui.input_action_button(
+ ui.input_task_button(
"csv_query",
"CSV Query",
class_="btn-primary",
@@ -673,7 +674,7 @@ def loaded_example_text():
where="afterEnd",
)
res_click.set(1)
- thinking = ui.notification_show("Message: API Query Running.", duration=None)
+
# isolate input.search_type to prevent trigger when options change.
with reactive.isolate():
if input.search_type() == 'STRprofiler Database':
@@ -687,7 +688,7 @@ def loaded_example_text():
)
elif input.search_type() == 'Cellosaurus Database (CLASTR)':
- malformed_markers = _valid_marker_check(query.keys())
+ malformed_markers = utils.validate_api_markers(query.keys())
if malformed_markers:
notify_modal(malformed_markers)
@@ -697,7 +698,8 @@ def loaded_example_text():
input.score_amel_query(),
input.query_filter_threshold()
)
- ui.notification_remove(thinking)
+ # TO DO: Does this need to be async?
+
return results
@output
@@ -805,7 +807,7 @@ def batch_query_results():
ui.remove_ui("#inserted-downloader2")
return pd.DataFrame({"": []})
try:
- query_df = sp.str_ingress(
+ query_df = utils.str_ingress(
[file[0]["datapath"]],
sample_col="Sample",
marker_col="Marker",
@@ -850,6 +852,7 @@ def batch_query_results():
{"id": "inserted-downloader2"},
ui.download_button(
"download2", "Download XLSX", width="25%", class_="btn-primary"
+ # TO DO: Adjust spacing on 'results' section. XLSX button is too far down.
),
),
selector="#res_card_batch",
@@ -870,8 +873,7 @@ def batch_query_results():
)
elif input.search_type_batch() == 'Cellosaurus Database (CLASTR)':
clastr_query = [(lambda d: d.update(description=key) or d)(val) for (key, val) in query_df.items()]
-
- malformed_markers = _valid_marker_check(query_df[next(iter(query_df))].keys())
+ malformed_markers = utils.validate_api_markers(query_df[next(iter(query_df))].keys())
if malformed_markers:
notify_modal(malformed_markers)
@@ -881,6 +883,8 @@ def batch_query_results():
input.score_amel_batch(),
input.batch_query_filter_threshold()
)
+ # TO DO: Does this need to be async?
+
return results
# File input loading
@@ -935,7 +939,7 @@ def file_query_results():
if file is None:
ui.remove_ui("#inserted-downloader3")
return pd.DataFrame({"": []})
- query_df = sp.str_ingress(
+ query_df = utils.str_ingress(
[file[0]["datapath"]],
sample_col="Sample",
marker_col="Marker",
diff --git a/strprofiler/utils.py b/strprofiler/utils.py
index d3e533d..b137a50 100644
--- a/strprofiler/utils.py
+++ b/strprofiler/utils.py
@@ -35,14 +35,14 @@ def _clean_element(x):
return ",".join(sorted_elements)
-def _pentafix(samps_dict, reverse = False):
+def _pentafix(samps_dict, reverse=False):
"""Takes a dictionary of alleles and returns a dictionary with common Penta markers renamed for consistency."""
if not reverse:
if "Penta C" in samps_dict.keys():
samps_dict["PentaC"] = samps_dict.pop("Penta C")
elif "Penta_C" in samps_dict.keys():
samps_dict["PentaC"] = samps_dict.pop("Penta_C")
-
+
if "Penta D" in samps_dict.keys():
samps_dict["PentaD"] = samps_dict.pop("Penta D")
elif "Penta_D" in samps_dict.keys():
@@ -140,7 +140,8 @@ def _make_html(dataframe: pd.DataFrame):
{table_html}
-
+