From 16cc35a1624a970e505f063c5e1cfc34d49d71c9 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 15 Jul 2024 13:39:43 -0400
Subject: [PATCH 01/36] Update STR data pipeline for new data

Major changes here are:

* Instead of a single `reference_region`, STRs now have a list of `reference_regions`, with a single one designated the `main_reference_region`.
* Allele size distributions and genotype distributions were previously stored as multidimensional data encoded in several levels of nested structs. That was serviceable when there were only one or two dimensions we might want to filter on, but it was getting increasingly convoluted. Since this new data expands the number of dimensions further, rather than build on the former schema and confuse things more, these distributions are now represented as a flattened list of structs, each of which represents a single subset of the distribution.
---
 .../gnomad_v3_short_tandem_repeats.py         | 529 ++++--------------
 .../pipelines/export_to_elasticsearch.py      |   2 +-
 .../gnomad_v3_short_tandem_repeats.py         |   4 +-
 3 files changed, 106 insertions(+), 429 deletions(-)

diff --git a/data-pipeline/src/data_pipeline/datasets/gnomad_v3/gnomad_v3_short_tandem_repeats.py b/data-pipeline/src/data_pipeline/datasets/gnomad_v3/gnomad_v3_short_tandem_repeats.py
index e27fa872d..901fca3e5 100644
--- a/data-pipeline/src/data_pipeline/datasets/gnomad_v3/gnomad_v3_short_tandem_repeats.py
+++ b/data-pipeline/src/data_pipeline/datasets/gnomad_v3/gnomad_v3_short_tandem_repeats.py
@@ -1,6 +1,4 @@
-import itertools
 import json
-from collections import defaultdict
 
 import hail as hl
 
@@ -8,12 +6,8 @@
 def _parse_region_id(region_id):
     [chrom, position_range] = region_id.split(":")
     chrom = chrom[3:]
-    [start, stop] = map(int, position_range.split("-"))
-    return {
-        "chrom": chrom,
-        "start": start,
-        "stop": stop,
-    }
+    [start, stop] = list(map(int, position_range.split("-")))
+    return {"chrom": chrom, "start": start, "stop": stop, "reference_genome": "GRCh38"}
 
 
 def _prepare_histogram(histogram):
@@ -23,161 +17,6 @@ def _prepare_histogram(histogram):
     )
 
 
-def _population_sort_key(pop):
-    pop_id = pop["id"]
-    if pop_id == "XX" or pop_id == "XY":
-        return ("zzz", pop_id)
-
-    if "_" in pop_id:
-        return tuple(pop_id.split("_"))
-
-    return (pop_id, "")
-
-
-def _get_total_histogram(histogram):
-    total = defaultdict(int)
-    for v in histogram.values():
-        for k, n in v.items():
-            total[k] += n
-
-    return total
-
-
-def _prepare_allele_size_distribution_populations(locus):
-    populations = sorted(set(key.split("/")[0] for key in locus["AlleleCountHistogram"].keys()))
-
-    distributions = sorted(
-        list(
-            itertools.chain.from_iterable(
-                [
-                    {
-                        "id": population,
-                        "distribution": _prepare_histogram(
-                            _get_total_histogram(
-                                {
-                                    k: v
-                                    for k, v in locus["AlleleCountHistogram"].items()
-                                    if k.split("/")[0] == population
-                                }
-                            )
-                        ),
-                    },
-                    {
-                        "id": f"{population}_XX",
-                        "distribution": _prepare_histogram(
-                            _get_total_histogram(
-                                {
-                                    k: v
-                                    for k, v in locus["AlleleCountHistogram"].items()
-                                    if k.split("/")[0] == population and k.split("/")[1] == "XX"
-                                }
-                            )
-                        ),
-                    },
-                    {
-                        "id": f"{population}_XY",
-                        "distribution": _prepare_histogram(
-                            _get_total_histogram(
-                                {
-                                    k: v
-                                    for k, v in locus["AlleleCountHistogram"].items()
-                                    if k.split("/")[0] == population and k.split("/")[1] == "XY"
-                                }
-                            )
-                        ),
-                    },
-                ]
-                for population in populations
-            )
-        )
-        + [
-            {
-                "id": sex,
-                "distribution": _prepare_histogram(
-                    _get_total_histogram(
-                        {k: v for k, v in locus["AlleleCountHistogram"].items() if k.split("/")[1] == sex}
-                    )
-                ),
-            }
-            for sex in ["XX", "XY"]
-        ],
-        key=_population_sort_key,
-    )
-
-    return [distribution for distribution in distributions if distribution["distribution"]]
-
-
-def _prepare_allele_size_distribution_repeat_units(locus):
-    repeat_units = sorted(set(key.split("/")[2] for key in locus["AlleleCountHistogram"].keys()))
-    populations = sorted(set(key.split("/")[0] for key in locus["AlleleCountHistogram"].keys()))
-
-    distributions = sorted(
-        [
-            {
-                "repeat_unit": repeat_unit,
-                "distribution": _prepare_histogram(
-                    _get_total_histogram(
-                        {k: v for k, v in locus["AlleleCountHistogram"].items() if k.split("/")[2] == repeat_unit}
-                    )
-                ),
-                "populations": sorted(
-                    list(
-                        itertools.chain.from_iterable(
-                            [
-                                {
-                                    "id": population,
-                                    "distribution": _prepare_histogram(
-                                        _get_total_histogram(
-                                            {
-                                                k: v
-                                                for k, v in locus["AlleleCountHistogram"].items()
-                                                if k.split("/")[2] == repeat_unit and k.split("/")[0] == population
-                                            }
-                                        )
-                                    ),
-                                },
-                                {
-                                    "id": f"{population}_XX",
-                                    "distribution": _prepare_histogram(
-                                        locus["AlleleCountHistogram"].get(f"{population}/XX/{repeat_unit}", {})
-                                    ),
-                                },
-                                {
-                                    "id": f"{population}_XY",
-                                    "distribution": _prepare_histogram(
-                                        locus["AlleleCountHistogram"].get(f"{population}/XY/{repeat_unit}", {})
-                                    ),
-                                },
-                            ]
-                            for population in populations
-                        )
-                    )
-                    + [
-                        {
-                            "id": sex,
-                            "distribution": _prepare_histogram(
-                                _get_total_histogram(
-                                    {
-                                        k: v
-                                        for k, v in locus["AlleleCountHistogram"].items()
-                                        if k.split("/")[2] == repeat_unit and k.split("/")[1] == sex
-                                    }
-                                )
-                            ),
-                        }
-                        for sex in ["XX", "XY"]
-                    ],
-                    key=_population_sort_key,
-                ),
-            }
-            for repeat_unit in repeat_units
-        ],
-        key=lambda r: (len(r["repeat_unit"]), r["repeat_unit"]),
-    )
-
-    return [distribution for distribution in distributions if distribution["distribution"]]
-
-
 def _prepare_age_distribution(locus):
     age_bins = [
         ("<20", None, 20),
@@ -205,192 +44,6 @@ def _prepare_age_distribution(locus):
     ]
 
 
-def _prepare_genotype_distribution_histogram(histogram):
-    return sorted(
-        ([*(int(n) for n in n_repeats.split("/")), n_samples] for n_repeats, n_samples in histogram.items()),
-        key=lambda value: (value[0], value[1]),
-    )
-
-
-def _filter_genotype_distribution_histogram(histogram, repeat_units=None, population=None, sex=None):
-    predicates = []
-    if repeat_units:
-        predicates.append(
-            lambda key: tuple(sorted(key.split("/")[2:4])) in (repeat_units, tuple(reversed(repeat_units)))
-        )
-    if population:
-        predicates.append(lambda key: key.split("/")[0] == population)
-    if sex:
-        predicates.append(lambda key: key.split("/")[1] == sex)
-
-    filtered_histogram = {k: v for k, v in histogram.items() if all(predicate(k) for predicate in predicates)}
-
-    if not repeat_units:
-        return filtered_histogram
-
-    return dict(
-        itertools.chain(
-            ((k, v) for k, v in filtered_histogram.items() if tuple(k.split("/")[2:4]) == repeat_units),
-            (
-                (f"{k}-reversed", {"/".join(reversed(vk.split("/"))): vv for vk, vv in v.items()})
-                for k, v in filtered_histogram.items()
-                if tuple(k.split("/")[2:4]) == tuple(reversed(repeat_units))
-                and tuple(k.split("/")[2:4]) != repeat_units
-            ),
-        )
-    )
-
-
-def _prepare_genotype_distribution_populations(locus):
-    populations = sorted(set(key.split("/")[0] for key in locus["AlleleCountScatterPlot"].keys()))
-
-    distributions = sorted(
-        list(
-            itertools.chain.from_iterable(
-                [
-                    {
-                        "id": population,
-                        "distribution": _prepare_genotype_distribution_histogram(
-                            _get_total_histogram(
-                                _filter_genotype_distribution_histogram(
-                                    locus["AlleleCountScatterPlot"], population=population
-                                )
-                            )
-                        ),
-                    },
-                    {
-                        "id": f"{population}_XX",
-                        "distribution": _prepare_genotype_distribution_histogram(
-                            _get_total_histogram(
-                                _filter_genotype_distribution_histogram(
-                                    locus["AlleleCountScatterPlot"], population=population, sex="XX"
-                                )
-                            )
-                        ),
-                    },
-                    {
-                        "id": f"{population}_XY",
-                        "distribution": _prepare_genotype_distribution_histogram(
-                            _get_total_histogram(
-                                _filter_genotype_distribution_histogram(
-                                    locus["AlleleCountScatterPlot"], population=population, sex="XY"
-                                )
-                            )
-                        ),
-                    },
-                ]
-                for population in populations
-            )
-        )
-        + [
-            {
-                "id": sex,
-                "distribution": _prepare_genotype_distribution_histogram(
-                    _get_total_histogram(
-                        _filter_genotype_distribution_histogram(locus["AlleleCountScatterPlot"], sex=sex)
-                    )
-                ),
-            }
-            for sex in ["XX", "XY"]
-        ],
-        key=_population_sort_key,
-    )
-
-    return [distribution for distribution in distributions if distribution["distribution"]]
-
-
-def _prepare_genotype_distribution_repeat_units(locus):
-    repeat_unit_pairs = sorted(
-        set(tuple(sorted(key.split("/")[2:4])) for key in locus["AlleleCountScatterPlot"].keys())
-    )
-    populations = sorted(set(key.split("/")[0] for key in locus["AlleleCountScatterPlot"].keys()))
-
-    distributions = sorted(
-        [
-            {
-                "repeat_units": list(repeat_unit_pair),
-                "distribution": _prepare_genotype_distribution_histogram(
-                    _get_total_histogram(
-                        _filter_genotype_distribution_histogram(
-                            locus["AlleleCountScatterPlot"], repeat_units=repeat_unit_pair
-                        )
-                    )
-                ),
-                "populations": sorted(
-                    list(
-                        itertools.chain.from_iterable(
-                            [
-                                {
-                                    "id": population,
-                                    "distribution": _prepare_genotype_distribution_histogram(
-                                        _get_total_histogram(
-                                            _filter_genotype_distribution_histogram(
-                                                locus["AlleleCountScatterPlot"],
-                                                repeat_units=repeat_unit_pair,
-                                                population=population,
-                                            )
-                                        )
-                                    ),
-                                },
-                                {
-                                    "id": f"{population}_XX",
-                                    "distribution": _prepare_genotype_distribution_histogram(
-                                        _get_total_histogram(
-                                            _filter_genotype_distribution_histogram(
-                                                locus["AlleleCountScatterPlot"],
-                                                repeat_units=repeat_unit_pair,
-                                                population=population,
-                                                sex="XX",
-                                            )
-                                        )
-                                    ),
-                                },
-                                {
-                                    "id": f"{population}_XY",
-                                    "distribution": _prepare_genotype_distribution_histogram(
-                                        _get_total_histogram(
-                                            _filter_genotype_distribution_histogram(
-                                                locus["AlleleCountScatterPlot"],
-                                                repeat_units=repeat_unit_pair,
-                                                population=population,
-                                                sex="XY",
-                                            )
-                                        )
-                                    ),
-                                },
-                            ]
-                            for population in populations
-                        )
-                    )
-                    + [
-                        {
-                            "id": sex,
-                            "distribution": _prepare_genotype_distribution_histogram(
-                                _get_total_histogram(
-                                    _filter_genotype_distribution_histogram(
-                                        locus["AlleleCountScatterPlot"], repeat_units=repeat_unit_pair, sex=sex
-                                    )
-                                )
-                            ),
-                        }
-                        for sex in ["XX", "XY"]
-                    ],
-                    key=_population_sort_key,
-                ),
-            }
-            for repeat_unit_pair in repeat_unit_pairs
-        ],
-        key=lambda r: (
-            len(r["repeat_units"][0]),
-            len(r["repeat_units"][1]),
-            r["repeat_units"][0],
-            r["repeat_units"][1],
-        ),
-    )
-
-    return [distribution for distribution in distributions if distribution["distribution"]]
-
-
 def _prepare_disease_repeat_size_classifications(disease):
     ranges = []
 
@@ -414,6 +67,63 @@ def _prepare_disease_repeat_size_classifications(disease):
 }
 
 
+def _parse_allele_count_histogram_section(cohort_key, distribution):
+    [ancestry_group, sex, repunit, quality_description, q_score] = cohort_key.split("/")
+    return {
+        "ancestry_group": ancestry_group,
+        "sex": sex,
+        "repunit": repunit,
+        "quality_description": quality_description.lower(),
+        "q_score": float(q_score),
+        "distribution": [{"repunit_count": int(k), "frequency": v} for k, v in distribution.items()],
+    }
+
+
+def _prepare_allele_size_distribution(allele_count_histogram):
+    return [_parse_allele_count_histogram_section(k, v) for (k, v) in allele_count_histogram.items()]
+
+
+def _parse_allele_scatter_plot_item(item):
+    (key, value) = item
+    [short_allele_repunit_count, long_allele_repunit_count] = key.split("/")
+    return {
+        "short_allele_repunit_count": int(short_allele_repunit_count),
+        "long_allele_repunit_count": int(long_allele_repunit_count),
+        "frequency": value,
+    }
+
+
+def _parse_allele_scatter_plot_distribution(distribution):
+    return list(map(_parse_allele_scatter_plot_item, distribution.items()))
+
+
+def _parse_allele_scatter_plot_histogram_section(cohort_key, distribution):
+    [ancestry_group, sex, short_allele_repunit, long_allele_repunit, quality_description, q_score] = cohort_key.split(
+        "/"
+    )
+    return {
+        "ancestry_group": ancestry_group,
+        "sex": sex,
+        "short_allele_repunit": short_allele_repunit,
+        "long_allele_repunit": long_allele_repunit,
+        "quality_description": quality_description,
+        "q_score": float(q_score),
+        "distribution": _parse_allele_scatter_plot_distribution(distribution),
+    }
+
+
+def _prepare_genotype_distribution(allele_scatter_plot_histogram):
+    return [_parse_allele_scatter_plot_histogram_section(k, v) for k, v in allele_scatter_plot_histogram.items()]
+
+
+def _parse_reference_regions(regions):
+    # "regions" may be a single string or list of strings
+
+    if type(regions) == str:
+        return [_parse_region_id(regions)]
+    return list(map(_parse_region_id, regions))
+
+
 def prepare_gnomad_v3_short_tandem_repeats(path):
     with hl.hadoop_open(path) as input_file:
         data = json.load(input_file)
@@ -435,7 +145,8 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
                 for disease in locus["Diseases"]
             ],
             "stripy_id": locus["STRipyName"] if "STRipyName" in locus else None,
-            "reference_region": {"reference_genome": "GRCh38", **_parse_region_id(locus["ReferenceRegion"])},
+            "main_reference_region": _parse_region_id(locus["MainReferenceRegion"]),
+            "reference_regions": _parse_reference_regions(locus["ReferenceRegion"]),
             "reference_repeat_unit": locus["ReferenceRepeatUnit"],
             "repeat_units": sorted(
                 (
@@ -456,18 +167,8 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
                 ),
                 key=lambda r: (len(r["repeat_unit"]), r["repeat_unit"]),
             ),
-            "allele_size_distribution": {
-                "distribution": _prepare_histogram(_get_total_histogram(locus["AlleleCountHistogram"])),
-                "populations": _prepare_allele_size_distribution_populations(locus),
-                "repeat_units": _prepare_allele_size_distribution_repeat_units(locus),
-            },
-            "genotype_distribution": {
-                "distribution": _prepare_genotype_distribution_histogram(
-                    _get_total_histogram(locus["AlleleCountScatterPlot"])
-                ),
-                "populations": _prepare_genotype_distribution_populations(locus),
-                "repeat_units": _prepare_genotype_distribution_repeat_units(locus),
-            },
+            "allele_size_distribution": _prepare_allele_size_distribution(locus["AlleleCountHistogram"]),
+            "genotype_distribution": _prepare_genotype_distribution(locus["AlleleCountScatterPlot"]),
             "age_distribution": _prepare_age_distribution(locus),
             "adjacent_repeats": sorted(
                 [
@@ -482,20 +183,12 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
                             set(k.split("/")[2] for k in adjacent_repeat["AlleleCountHistogram"].keys()),
                             key=lambda repeat_unit: (len(repeat_unit), repeat_unit),
                         ),
-                        "allele_size_distribution": {
-                            "distribution": _prepare_histogram(
-                                _get_total_histogram(adjacent_repeat["AlleleCountHistogram"])
-                            ),
-                            "populations": _prepare_allele_size_distribution_populations(adjacent_repeat),
-                            "repeat_units": _prepare_allele_size_distribution_repeat_units(adjacent_repeat),
-                        },
-                        "genotype_distribution": {
-                            "distribution": _prepare_genotype_distribution_histogram(
-                                _get_total_histogram(adjacent_repeat["AlleleCountScatterPlot"])
-                            ),
-                            "populations": _prepare_genotype_distribution_populations(adjacent_repeat),
-                            "repeat_units": _prepare_genotype_distribution_repeat_units(adjacent_repeat),
-                        },
+                        "allele_size_distribution": _prepare_allele_size_distribution(
+                            adjacent_repeat["AlleleCountHistogram"]
+                        ),
+                        "genotype_distribution": _prepare_genotype_distribution(
+                            adjacent_repeat["AlleleCountScatterPlot"]
+                        ),
                         "age_distribution": _prepare_age_distribution(adjacent_repeat),
                     }
                     for adjacent_repeat_id, adjacent_repeat in locus.get("AdjacentRepeats", {}).items()
@@ -506,7 +199,31 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
         for locus in data.values()
     ]
 
-    return hl.Table.parallelize(
+    allele_size_distribution_schema = hl.tarray(
+        hl.tstruct(
+            ancestry_group=hl.tstr,
+            sex=hl.tstr,
+            repunit=hl.tstr,
+            quality_description=hl.tstr,
+            q_score=hl.tfloat,
+            distribution=hl.tarray(hl.tstruct(repunit_count=hl.tint, frequency=hl.tint)),
+        )
+    )
+    genotype_distribution_schema = hl.tarray(
+        hl.tstruct(
+            ancestry_group=hl.tstr,
+            sex=hl.tstr,
+            short_allele_repunit=hl.tstr,
+            long_allele_repunit=hl.tstr,
+            quality_description=hl.tstr,
+            q_score=hl.tfloat,
+            distribution=hl.tarray(
+                hl.tstruct(short_allele_repunit_count=hl.tint, long_allele_repunit_count=hl.tint, frequency=hl.tfloat)
+            ),
+        )
+    )
+
+    ds = hl.Table.parallelize(
         ds,
         hl.tstruct(
             id=hl.tstr,
@@ -521,31 +238,14 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
                     notes=hl.tstr,
                 )
             ),
-            reference_region=hl.tstruct(reference_genome=hl.tstr, chrom=hl.tstr, start=hl.tint, stop=hl.tint),
+            main_reference_region=hl.tstruct(reference_genome=hl.tstr, chrom=hl.tstr, start=hl.tint, stop=hl.tint),
+            reference_regions=hl.tarray(
+                hl.tstruct(reference_genome=hl.tstr, chrom=hl.tstr, start=hl.tint, stop=hl.tint)
+            ),
             reference_repeat_unit=hl.tstr,
             repeat_units=hl.tarray(hl.tstruct(repeat_unit=hl.tstr, classification=hl.tstr)),
-            allele_size_distribution=hl.tstruct(
-                distribution=hl.tarray(hl.tarray(hl.tint)),
-                populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                repeat_units=hl.tarray(
-                    hl.tstruct(
-                        repeat_unit=hl.tstr,
-                        distribution=hl.tarray(hl.tarray(hl.tint)),
-                        populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                    )
-                ),
-            ),
-            genotype_distribution=hl.tstruct(
-                distribution=hl.tarray(hl.tarray(hl.tint)),
-                populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                repeat_units=hl.tarray(
-                    hl.tstruct(
-                        repeat_units=hl.tarray(hl.tstr),
-                        distribution=hl.tarray(hl.tarray(hl.tint)),
-                        populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                    )
-                ),
-            ),
+            allele_size_distribution=allele_size_distribution_schema,
+            genotype_distribution=genotype_distribution_schema,
             age_distribution=hl.tarray(
                 hl.tstruct(age_range=hl.tarray(hl.tint), distribution=hl.tarray(hl.tarray(hl.tint)))
             ),
@@ -556,32 +256,8 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
                     reference_region=hl.tstruct(reference_genome=hl.tstr, chrom=hl.tstr, start=hl.tint, stop=hl.tint),
                     reference_repeat_unit=hl.tstr,
                     repeat_units=hl.tarray(hl.tstr),
-                    allele_size_distribution=hl.tstruct(
-                        distribution=hl.tarray(hl.tarray(hl.tint)),
-                        populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                        repeat_units=hl.tarray(
-                            hl.tstruct(
-                                repeat_unit=hl.tstr,
-                                distribution=hl.tarray(hl.tarray(hl.tint)),
-                                populations=hl.tarray(
-                                    hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))
-                                ),
-                            )
-                        ),
-                    ),
-                    genotype_distribution=hl.tstruct(
-                        distribution=hl.tarray(hl.tarray(hl.tint)),
-                        populations=hl.tarray(hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))),
-                        repeat_units=hl.tarray(
-                            hl.tstruct(
-                                repeat_units=hl.tarray(hl.tstr),
-                                distribution=hl.tarray(hl.tarray(hl.tint)),
-                                populations=hl.tarray(
-                                    hl.tstruct(id=hl.tstr, distribution=hl.tarray(hl.tarray(hl.tint)))
-                                ),
-                            )
-                        ),
-                    ),
+                    allele_size_distribution=allele_size_distribution_schema,
+                    genotype_distribution=genotype_distribution_schema,
                     age_distribution=hl.tarray(
                         hl.tstruct(age_range=hl.tarray(hl.tint), distribution=hl.tarray(hl.tarray(hl.tint)))
                     ),
@@ -590,3 +266,4 @@ def prepare_gnomad_v3_short_tandem_repeats(path):
         ),
         n_partitions=1,
     )
+    return ds
diff --git a/data-pipeline/src/data_pipeline/pipelines/export_to_elasticsearch.py b/data-pipeline/src/data_pipeline/pipelines/export_to_elasticsearch.py
index 9ddfa8b7b..e91b9d2d3 100644
--- a/data-pipeline/src/data_pipeline/pipelines/export_to_elasticsearch.py
+++ b/data-pipeline/src/data_pipeline/pipelines/export_to_elasticsearch.py
@@ -284,7 +284,7 @@ def add_liftover_document_id(ds):
         ),
         "args": {
             "index": "gnomad_v3_short_tandem_repeats",
-            "index_fields": ["id", "gene.ensembl_id", "reference_region"],
+            "index_fields": ["id", "gene.ensembl_id", "main_reference_region"],
             "id_field": "id",
             "num_shards": 1,
         },
diff --git a/data-pipeline/src/data_pipeline/pipelines/gnomad_v3_short_tandem_repeats.py b/data-pipeline/src/data_pipeline/pipelines/gnomad_v3_short_tandem_repeats.py
index 04848c871..f303e7ed7 100644
--- a/data-pipeline/src/data_pipeline/pipelines/gnomad_v3_short_tandem_repeats.py
+++ b/data-pipeline/src/data_pipeline/pipelines/gnomad_v3_short_tandem_repeats.py
@@ -8,8 +8,8 @@
 pipeline.add_task(
     "prepare_short_tandem_repeats",
     prepare_gnomad_v3_short_tandem_repeats,
-    "/gnomad_v3/gnomad_v3_short_tandem_repeats.ht",
-    {"path": "gs://gcp-public-data--gnomad/release/3.1.3/json/gnomAD_STR_distributions__2022_01_20.json.gz"},
+    "/gnomad_v4/gnomad_v4_short_tandem_repeats.ht",
+    {"path": "gs://gnomad-browser-data-pipeline/phil-scratch/gnomAD_STR_distributions__gnomad-v2__2024_06_28.json"},
 )
 
 ###############################################

From 1395bf013b113b31ac2482f7ebe7baa8a697bc51 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 15 Jul 2024 16:27:14 -0400
Subject: [PATCH 02/36] DONTMERGE: temporarily hard-code the gnomad_r4 STR index name

---
 graphql-api/src/queries/short-tandem-repeat-queries.ts | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/graphql-api/src/queries/short-tandem-repeat-queries.ts b/graphql-api/src/queries/short-tandem-repeat-queries.ts
index d4b1eb2d2..e883835d4 100644
--- a/graphql-api/src/queries/short-tandem-repeat-queries.ts
+++ b/graphql-api/src/queries/short-tandem-repeat-queries.ts
@@ -5,7 +5,8 @@ import { fetchAllSearchResults } from './helpers/elasticsearch-helpers'
 
 const SHORT_TANDEM_REPEAT_INDICES = {
   gnomad_r3: 'gnomad_v3_short_tandem_repeats',
-  gnomad_r4: 'gnomad_v3_short_tandem_repeats',
+  // TK
+  gnomad_r4: 'gnomad_v3_short_tandem_repeats-2024-07-15--17-34',
 }
 
 const SUMMARY_FIELDS = [

From 68b7e2c8b903295ff7794e8ff2e77e97ed2c457b Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 15 Jul 2024 16:45:50 -0400
Subject: [PATCH 03/36] Update GraphQL schema for STRs to reflect new ES schema

---
 .../graphql/types/short-tandem-repeat.graphql | 66 +++++++++----------
 1 file changed, 32 insertions(+), 34 deletions(-)

diff --git a/graphql-api/src/graphql/types/short-tandem-repeat.graphql b/graphql-api/src/graphql/types/short-tandem-repeat.graphql
index 52dd64ae0..2ba0f2caf 100644
--- a/graphql-api/src/graphql/types/short-tandem-repeat.graphql
+++ b/graphql-api/src/graphql/types/short-tandem-repeat.graphql
@@ -31,43 +31,39 @@ type ShortTandemRepeatRepeatUnit {
   classification: String!
 }
 
-type ShortTandemRepeatAlleleSizeDistributionPopulation {
-  id: String!
-  distribution: [[Int!]!]!
-}
-
-type ShortTandemRepeatAlleleSizeDistributionRepeatUnit {
-  repeat_unit: String!
-  distribution: [[Int!]!]!
-  populations: [ShortTandemRepeatAlleleSizeDistributionPopulation!]!
-}
-
-type ShortTandemRepeatAlleleSizeDistribution {
+type ShortTandemRepeatAgeDistributionBin {
+  age_range: [Int]!
   distribution: [[Int!]!]!
-  populations: [ShortTandemRepeatAlleleSizeDistributionPopulation!]!
-  repeat_units: [ShortTandemRepeatAlleleSizeDistributionRepeatUnit!]!
 }
 
-type ShortTandemRepeatGenotypeDistributionPopulation {
-  id: String!
-  distribution: [[Int!]!]!
+type ShortTandemRepeatAlleleSizeItem {
+  repunit_count: Int!
+  frequency: Int!
 }
 
-type ShortTandemRepeatGenotypeDistributionRepeatUnit {
-  repeat_units: [String!]!
-  distribution: [[Int!]!]!
-  populations: [ShortTandemRepeatGenotypeDistributionPopulation!]!
+type ShortTandemRepeatAlleleSizeDistributionCohort {
+  ancestry_group: String!
+  sex: String!
+  repunit: String!
+  quality_description: String!
+  q_score: Float!
+  distribution: [ShortTandemRepeatAlleleSizeItem!]!
 }
 
-type ShortTandemRepeatGenotypeDistribution {
-  distribution: [[Int!]!]!
-  populations: [ShortTandemRepeatGenotypeDistributionPopulation!]!
-  repeat_units: [ShortTandemRepeatGenotypeDistributionRepeatUnit!]!
+type ShortTandemRepeatGenotypeItem {
+  short_allele_repunit_count: Int!
+  long_allele_repunit_count: Int!
+  frequency: Int!
 }
 
-type ShortTandemRepeatAgeDistributionBin {
-  age_range: [Int]!
-  distribution: [[Int!]!]!
+type ShortTandemRepeatGenotypeDistributionCohort {
+  ancestry_group: String!
+  sex: String!
+  short_allele_repunit: String!
+  long_allele_repunit: String!
+  quality_description: String!
+  q_score: Float!
+  distribution: [ShortTandemRepeatGenotypeItem!]!
 }
 
 type ShortTandemRepeatAdjacentRepeat {
@@ -75,8 +71,8 @@ type ShortTandemRepeatAdjacentRepeat {
   reference_region: ShortTandemRepeatReferenceRegion!
   reference_repeat_unit: String!
   repeat_units: [String!]!
-  allele_size_distribution: ShortTandemRepeatAlleleSizeDistribution!
-  genotype_distribution: ShortTandemRepeatGenotypeDistribution!
+  allele_size_distribution: [ShortTandemRepeatAlleleSizeDistributionCohort!]!
+  genotype_distribution: [ShortTandemRepeatGenotypeDistributionCohort!]!
   age_distribution: [ShortTandemRepeatAgeDistributionBin!]
 }
 
@@ -85,7 +81,8 @@ type ShortTandemRepeat {
   gene: ShortTandemRepeatGene!
   associated_diseases: [ShortTandemRepeatAssociatedDisease!]!
   stripy_id: String!
-  reference_region: ShortTandemRepeatReferenceRegion!
+  main_reference_region: ShortTandemRepeatReferenceRegion!
+  reference_regions: [ShortTandemRepeatReferenceRegion!]!
   reference_repeat_unit: String!
 }
 
@@ -94,11 +91,12 @@ type ShortTandemRepeatDetails {
   gene: ShortTandemRepeatGene!
   associated_diseases: [ShortTandemRepeatAssociatedDisease!]!
   stripy_id: String
-  reference_region: ShortTandemRepeatReferenceRegion!
+  main_reference_region: ShortTandemRepeatReferenceRegion!
+  reference_regions: [ShortTandemRepeatReferenceRegion!]!
   reference_repeat_unit: String!
   repeat_units: [ShortTandemRepeatRepeatUnit!]!
-  allele_size_distribution: ShortTandemRepeatAlleleSizeDistribution!
-  genotype_distribution: ShortTandemRepeatGenotypeDistribution!
+  allele_size_distribution: [ShortTandemRepeatAlleleSizeDistributionCohort!]!
+  genotype_distribution: [ShortTandemRepeatGenotypeDistributionCohort!]!
   age_distribution: [ShortTandemRepeatAgeDistributionBin!]
   adjacent_repeats: [ShortTandemRepeatAdjacentRepeat!]!
 }

From 900e7465a83e0f5752ff993b96940cf9916c59de Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Wed, 17 Jul 2024 15:39:28 -0400
Subject: [PATCH 04/36] WIP pop options refactored

---
 browser/src/GenePage/GenePageContainer.tsx    |   2 +-
 .../src/RegionPage/RegionPageContainer.tsx    |   2 +-
 .../ShortTandemRepeatPage.tsx                 | 244 +++++++++---------
 .../ShortTandemRepeatPopulationOptions.tsx    |  71 +++--
 dataset-metadata/gnomadPopulations.ts         |   9 +-
 5 files changed, 155 insertions(+), 173 deletions(-)

diff --git a/browser/src/GenePage/GenePageContainer.tsx b/browser/src/GenePage/GenePageContainer.tsx
index e78711c20..6d0ecdb1b 100644
--- a/browser/src/GenePage/GenePageContainer.tsx
+++ b/browser/src/GenePage/GenePageContainer.tsx
@@ -263,7 +263,7 @@ query ${operationName}($geneId: String, $geneSymbol: String, $referenceGenome: R
   }
 }
 `
-
+// TK check
 type Props = {
   datasetId: DatasetId
   geneIdOrSymbol: string
diff --git a/browser/src/RegionPage/RegionPageContainer.tsx b/browser/src/RegionPage/RegionPageContainer.tsx
index 45da7c9a5..e468a7268 100644
--- a/browser/src/RegionPage/RegionPageContainer.tsx
+++ b/browser/src/RegionPage/RegionPageContainer.tsx
@@ -47,7 +47,7 @@ const query = `
     }
   }
 `
-
+// TK check
 type Props = {
   datasetId: DatasetId
   regionId: string
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 833e19460..7b4d7edda 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -25,48 +25,53 @@ import {
   getGenotypeDistributionPlotAxisLabels,
 } from './shortTandemRepeatHelpers'
 import ShortTandemRepeatAdjacentRepeatSection from './ShortTandemRepeatAdjacentRepeatSection'
+import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
-type ShortTandemRepeatRepeatUnit = {
-  repeat_unit: string
-  distribution: number[][]
-  populations: {
-    id: string
-    distribution: number[][]
-  }[]
+type ShortTandemRepeatReferenceRegion = {
+  chrom: string
+  start: number
+  stop: number
+}
+
+type AlleleSizeDistributionItem = {
+  repunit_count: number
+  frequency: number
+}
+
+export type Sex = '' | 'XX' | 'XY'
+
+type AlleleSizeDistributionCohort = {
+  ancestry_group: AncestryGroupId
+  sex: Sex
+  repunit: string
+  quality_description: string
+  q_score: number
+  distribution: AlleleSizeDistributionItem[]
+}
+
+type GenotypeDistributionItem = {
+  short_allele_repunit_count: number
+  long_allele_repunit_count: number
+  frequency: number
+}
+
+type GenotypeDistributionCohort = {
+  ancestry_group: string
+  sex: Sex
+  short_allele_repunit: string
+  long_allele_repunit: string
+  quality_description: string
+  q_score: number
+  distribution: GenotypeDistributionItem[]
 }
 
 export type ShortTandemRepeatAdjacentRepeat = {
   id: string
-  reference_region: {
-    chrom: string
-    start: number
-    stop: number
-  }
+  reference_region: ShortTandemRepeatReferenceRegion
   reference_repeat_unit: string
   repeat_units: string[]
-  allele_size_distribution: {
-    distribution: number[][]
-    populations: {
-      id: string
-      distribution: number[][]
-    }[]
-    repeat_units: ShortTandemRepeatRepeatUnit[]
-  }
-  genotype_distribution: {
-    distribution: number[][]
-    populations: {
-      id: string
-      distribution: number[][]
-    }[]
-    repeat_units: {
-      repeat_units: string[]
-      distribution: number[][]
-      populations: {
-        id: string
-        distribution: number[][]
-      }[]
-    }[]
-  }
+  allele_size_distribution: AlleleSizeDistributionCohort[]
+  genotype_distribution: GenotypeDistributionCohort[]
 }
 
 export type ShortTandemRepeat = {
@@ -89,39 +94,15 @@ export type ShortTandemRepeat = {
     notes: string | null
   }[]
   stripy_id: string | null
-  reference_region: {
-    chrom: string
-    start: number
-    stop: number
-  }
+  main_reference_region: ShortTandemRepeatReferenceRegion
+  reference_regions: ShortTandemRepeatReferenceRegion[]
   reference_repeat_unit: string
   repeat_units: {
     repeat_unit: string
     classification: string
   }[]
-  allele_size_distribution: {
-    distribution: number[][]
-    populations: {
-      id: string
-      distribution: number[][]
-    }[]
-    repeat_units: ShortTandemRepeatRepeatUnit[]
-  }
-  genotype_distribution: {
-    distribution: number[][]
-    populations: {
-      id: string
-      distribution: number[][]
-    }[]
-    repeat_units: {
-      repeat_units: string[]
-      distribution: number[][]
-      populations: {
-        id: string
-        distribution: number[][]
-      }[]
-    }[]
-  }
+  allele_size_distribution: AlleleSizeDistributionCohort[]
+  genotype_distribution: GenotypeDistributionCohort[]
   adjacent_repeats: ShortTandemRepeatAdjacentRepeat[]
 }
 
@@ -160,31 +141,44 @@ type ShortTandemRepeatPageProps = {
   shortTandemRepeat: ShortTandemRepeat
 }
 
-const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
-  const [selectedRepeatUnit, setSelectedRepeatUnit] = useState(
-    shortTandemRepeat.allele_size_distribution.repeat_units.length === 1
-      ? shortTandemRepeat.allele_size_distribution.repeat_units[0].repeat_unit
-      : ''
-  )
-
-  const [selectedPopulationId, setSelectedPopulationId] = useState('')
-  const [selectedScaleType, setSelectedScaleType] = useState('linear')
+type ScaleType = 'linear' | 'log'
 
+const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
+  const { allele_size_distribution, genotype_distribution } = shortTandemRepeat
+
+  const alleleSizeDistributionRepunits = allele_size_distribution
+    .map((cohort) => cohort.repunit)
+    .sort()
+  const genotypeDistributionRepunitPairs = genotype_distribution
+    .map((cohort) => [cohort.short_allele_repunit, cohort.long_allele_repunit].join(', '))
+    .sort()
+
+  const defaultAlleleSizeRepunit =
+    alleleSizeDistributionRepunits.length === 1 ? alleleSizeDistributionRepunits[0] : ''
+  const defaultGenotypeDistributionRepunits =
+    genotypeDistributionRepunitPairs.length === 1 ? genotypeDistributionRepunitPairs[0] : ''
+  const defaultDisease = shortTandemRepeat.associated_diseases[0].name
+
+  const [selectedAncestryGroup, setSelectedAncestryGroup] = useState<string>('')
+  const [selectedSex, setSelectedSex] = useState<Sex>('')
+  const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
+    useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
-    useState(
-      shortTandemRepeat.genotype_distribution.repeat_units.length === 1
-        ? shortTandemRepeat.genotype_distribution.repeat_units[0].repeat_units.join(' / ')
-        : ''
+    useState<string>(defaultGenotypeDistributionRepunits)
+  const [selectedDisease, setSelectedDisease] = useState<string>(defaultDisease)
+  const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
+  const [showAdjacentRepeats, setShowAdjacentRepeats] = useState<boolean>(false)
+
+  const ancestryGroups = [
+    ...new Set(shortTandemRepeat.allele_size_distribution.map((cohort) => cohort.ancestry_group)),
+  ].sort()
+
+  const maxAlleleSizeDistributionRepeats = Math.max(
+    ...shortTandemRepeat.allele_size_distribution.flatMap((cohort) =>
+      cohort.distribution.map((item) => item.repunit_count)
     )
-
-  const [selectedDisease, setSelectedDisease] = useState(
-    shortTandemRepeat.associated_diseases[0].name
   )
 
-  const [showAdjacentRepeats, setShowAdjacentRepeats] = useState(false)
-
-  const populationIds = shortTandemRepeat.allele_size_distribution.populations.map((pop) => pop.id)
-
   const allRepeatUnitsByClassification: Record<string, string[]> = {}
   shortTandemRepeat.repeat_units.forEach((repeatUnit) => {
     if (allRepeatUnitsByClassification[repeatUnit.classification] === undefined) {
@@ -196,9 +190,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   // This uses repeat units from shortTandemRepeat.allele_size_distribution.repeat_units because
   // shortTandemRepeat.repeat_units may include repeat units that do not appear in gnomAD.
   const repeatUnitsFoundInGnomad = new Set(
-    shortTandemRepeat.allele_size_distribution.repeat_units.map(
-      (repeatUnit) => repeatUnit.repeat_unit
-    )
+    shortTandemRepeat.allele_size_distribution.map((cohort) => cohort.repunit)
   )
 
   const repeatUnitsFoundInGnomadByClassification: Record<string, string[]> = {}
@@ -283,25 +275,22 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         </h2>
         <ShortTandemRepeatAlleleSizeDistributionPlot
           // @ts-expect-error TS(2322) FIXME: Type '{ maxRepeats: number; alleleSizeDistribution... Remove this comment to see the full error message
-          maxRepeats={
-            shortTandemRepeat.allele_size_distribution.distribution[
-              shortTandemRepeat.allele_size_distribution.distribution.length - 1
-            ][0]
-          }
+          maxRepeats={maxAlleleSizeDistributionRepeats}
           alleleSizeDistribution={getSelectedAlleleSizeDistribution(shortTandemRepeat, {
-            selectedPopulationId,
-            selectedRepeatUnit,
+            selectedAncestryGroup,
+            selectedRepeatUnit: selectedAlleleSizeRepeatUnit,
           })}
           repeatUnitLength={
-            selectedRepeatUnit && !selectedRepeatUnit.startsWith('classification')
-              ? selectedRepeatUnit.length
+            selectedAlleleSizeRepeatUnit &&
+            !selectedAlleleSizeRepeatUnit.startsWith('classification')
+              ? selectedAlleleSizeRepeatUnit.length
               : null
           }
           ranges={
-            (selectedRepeatUnit === '' && allRepeatUnitsFoundInGnomadArePathogenic) ||
-            selectedRepeatUnit === 'classification/pathogenic' ||
+            (selectedAlleleSizeRepeatUnit === '' && allRepeatUnitsFoundInGnomadArePathogenic) ||
+            selectedAlleleSizeRepeatUnit === 'classification/pathogenic' ||
             ((repeatUnitsFoundInGnomadByClassification as any).pathogenic || []).includes(
-              selectedRepeatUnit
+              selectedAlleleSizeRepeatUnit
             )
               ? plotRanges
               : []
@@ -311,28 +300,29 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ControlSection style={{ marginTop: '0.5em' }}>
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-repeat-counts`}
-            populationIds={populationIds}
-            selectedPopulationId={selectedPopulationId}
-            onSelectPopulationId={setSelectedPopulationId}
+            ancestryGroups={ancestryGroups}
+            selectedAncestryGroup={selectedAncestryGroup}
+            selectedSex={selectedSex}
+            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedSex={setSelectedSex}
           />
 
           <label htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}>
             Repeat unit: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
             <Select
               id={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}
-              value={selectedRepeatUnit}
+              value={selectedAlleleSizeRepeatUnit}
               onChange={(e: any) => {
-                setSelectedRepeatUnit(e.target.value)
+                setSelectedAlleleSizeRepeatUnit(e.target.value)
               }}
             >
-              {shortTandemRepeat.allele_size_distribution.repeat_units.length === 1 ? (
-                <>
-                  {shortTandemRepeat.allele_size_distribution.repeat_units.map((repeatUnit) => (
-                    <option key={repeatUnit.repeat_unit} value={repeatUnit.repeat_unit}>
-                      {repeatUnit.repeat_unit}
-                    </option>
-                  ))}
-                </>
+              {alleleSizeDistributionRepunits.length === 1 ? (
+                <option
+                  key={alleleSizeDistributionRepunits[0]}
+                  value={alleleSizeDistributionRepunits[0]}
+                >
+                  {alleleSizeDistributionRepunits[0]}
+                </option>
               ) : (
                 <>
                   <option value="">All</option>
@@ -436,9 +426,11 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         )}
 
         {!(
-          (selectedRepeatUnit === '' && allRepeatUnitsFoundInGnomadArePathogenic) ||
-          selectedRepeatUnit === 'classification/pathogenic' ||
-          ((allRepeatUnitsByClassification as any).pathogenic || []).includes(selectedRepeatUnit)
+          (selectedAlleleSizeRepeatUnit === '' && allRepeatUnitsFoundInGnomadArePathogenic) ||
+          selectedAlleleSizeRepeatUnit === 'classification/pathogenic' ||
+          ((allRepeatUnitsByClassification as any).pathogenic || []).includes(
+            selectedAlleleSizeRepeatUnit
+          )
         ) && (
           <p style={{ marginBottom: 0 }}>
             <Badge level="info">Note</Badge> This plot includes non-pathogenic repeat units. Use the
@@ -466,7 +458,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           ]}
           genotypeDistribution={getSelectedGenotypeDistribution(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
-            selectedPopulationId,
+            selectedAncestryGroup,
           })}
           xRanges={
             (selectedGenotypeDistributionRepeatUnits === '' &&
@@ -496,8 +488,8 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-genotype-distribution`}
             populationIds={populationIds}
-            selectedPopulationId={selectedPopulationId}
-            onSelectPopulationId={setSelectedPopulationId}
+            selectedPopulationId={selectedAncestryGroup}
+            onSelectPopulationId={setSelectedAncestryGroup}
           />
 
           <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
@@ -558,7 +550,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         >
           <ShortTandemRepeatGenotypeDistributionBinDetails
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
-            selectedPopulationId={selectedPopulationId}
+            selectedPopulationId={selectedAncestryGroup}
             selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
             bin={selectedGenotypeDistributionBin}
           />
@@ -572,11 +564,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ShortTandemRepeatAgeDistributionPlot
           // @ts-expect-error TS(2322) FIXME: Type '{ ageDistribution: any; maxRepeats: number; ... Remove this comment to see the full error message
           ageDistribution={(shortTandemRepeat as any).age_distribution}
-          maxRepeats={
-            shortTandemRepeat.allele_size_distribution.distribution[
-              shortTandemRepeat.allele_size_distribution.distribution.length - 1
-            ][0]
-          }
+          maxRepeats={maxAlleleSizeDistributionRepeats}
           ranges={allRepeatUnitsFoundInGnomadArePathogenic ? plotRanges : []}
         />
         {!allRepeatUnitsFoundInGnomadArePathogenic && (
@@ -598,8 +586,8 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                   key={adjacentRepeat.id}
                   adjacentRepeat={adjacentRepeat}
                   populationIds={populationIds}
-                  selectedPopulationId={selectedPopulationId}
-                  onSelectPopulationId={setSelectedPopulationId}
+                  selectedPopulationId={selectedAncestryGroup}
+                  onSelectPopulationId={setSelectedAncestryGroup}
                   selectedScaleType={selectedScaleType}
                   onSelectScaleType={setSelectedScaleType}
                 />
@@ -633,15 +621,15 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-read-data`}
             populationIds={populationIds}
-            selectedPopulationId={selectedPopulationId}
-            onSelectPopulationId={setSelectedPopulationId}
+            selectedPopulationId={selectedAncestryGroup}
+            onSelectPopulationId={setSelectedAncestryGroup}
           />
         </ControlSection>
         <ShortTandemRepeatReads
           datasetId={datasetId}
           shortTandemRepeat={shortTandemRepeat}
           filter={{
-            ...parseCombinedPopulationId(selectedPopulationId),
+            ...parseCombinedPopulationId(selectedAncestryGroup),
           }}
         />
       </section>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index f217fc478..b8f041dbe 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -1,9 +1,14 @@
-import React from 'react'
+import React, { Dispatch, SetStateAction } from 'react'
 import styled from 'styled-components'
 
 import { Select } from '@gnomad/ui'
 
-import { GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
+import {
+  AncestryGroupId,
+  GNOMAD_ANCESTRY_GROUP_NAMES,
+} from '@gnomad/dataset-metadata/gnomadPopulations'
+
+import { Sex } from './ShortTandemRepeatPage'
 
 const Wrapper = styled.div`
   @media (max-width: 600px) {
@@ -19,28 +24,24 @@ const Wrapper = styled.div`
 
 type Props = {
   id: string
-  populationIds: string[]
-  selectedPopulationId: string
-  onSelectPopulationId: (...args: any[]) => any
+  ancestryGroups: AncestryGroupId[]
+  selectedAncestryGroup: AncestryGroupId
+  selectedSex: string
+  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId>>
+  setSelectedSex: Dispatch<SetStateAction<Sex>>
 }
 
 const ShortTandemRepeatPopulationOptions = ({
   id,
-  populationIds,
-  selectedPopulationId,
-  onSelectPopulationId,
+  ancestryGroups,
+  selectedAncestryGroup,
+  selectedSex,
+  setSelectedAncestryGroup,
+  setSelectedSex,
 }: Props) => {
-  const selectedAncestralPopulation =
-    selectedPopulationId === 'XX' || selectedPopulationId === 'XY'
-      ? ''
-      : selectedPopulationId.split('_')[0]
-
-  let selectedSex = ''
-  if (selectedPopulationId.endsWith('XX')) {
-    selectedSex = 'XX'
-  } else if (selectedPopulationId.endsWith('XY')) {
-    selectedSex = 'XY'
-  }
+  const ancestryGroupsSortedByName = ancestryGroups.sort((group1, group2) =>
+    GNOMAD_ANCESTRY_GROUP_NAMES[group1].localeCompare(GNOMAD_ANCESTRY_GROUP_NAMES[group2])
+  )
 
   return (
     <Wrapper>
@@ -49,36 +50,24 @@ const ShortTandemRepeatPopulationOptions = ({
         {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
         <Select
           id={`short-tandem-repeat-${id}-population-options-population`}
-          value={selectedAncestralPopulation}
-          onChange={(e: any) => {
-            onSelectPopulationId([e.target.value, selectedSex].filter(Boolean).join('_'))
-          }}
+          value={selectedAncestryGroup}
+          onChange={setSelectedAncestryGroup}
         >
           <option value="">Global</option>
-          {populationIds
-            .filter((popId) => !(popId.endsWith('XX') || popId.endsWith('XY')))
-            .sort((pop1, pop2) =>
-              // @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message
-              GNOMAD_POPULATION_NAMES[pop1].localeCompare(GNOMAD_POPULATION_NAMES[pop2])
-            )
-            .map((popId) => (
-              <option key={popId} value={popId}>
-                {/* @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message */}
-                {GNOMAD_POPULATION_NAMES[popId]}
-              </option>
-            ))}
+          {ancestryGroupsSortedByName.map((ancestryGroup) => (
+            <option key={ancestryGroup} value={ancestryGroup}>
+              {GNOMAD_ANCESTRY_GROUP_NAMES[ancestryGroup]}
+            </option>
+          ))}
         </Select>
-      </label>{' '}
+      </label>
+
       <label htmlFor={`short-tandem-repeat-${id}-population-options-sex`}>
         Sex: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
         <Select
           id={`short-tandem-repeat-${id}-population-options-sex`}
           value={selectedSex}
-          onChange={(e: any) => {
-            onSelectPopulationId(
-              [selectedAncestralPopulation, e.target.value].filter(Boolean).join('_')
-            )
-          }}
+          onChange={setSelectedSex}
         >
           <option value="">All</option>
           <option value="XX">XX</option>
diff --git a/dataset-metadata/gnomadPopulations.ts b/dataset-metadata/gnomadPopulations.ts
index 480cb2d6d..370d8c4a3 100644
--- a/dataset-metadata/gnomadPopulations.ts
+++ b/dataset-metadata/gnomadPopulations.ts
@@ -1,7 +1,7 @@
 import { textOrMissingTextWarning } from '../browser/src/missingContent'
 import { DatasetId, getTopLevelDataset } from './metadata'
 
-export const GNOMAD_POPULATION_NAMES = {
+export const GNOMAD_ANCESTRY_GROUP_NAMES = {
   afr: 'African/African American',
   ami: 'Amish',
   amr: 'Admixed American',
@@ -30,7 +30,12 @@ export const GNOMAD_POPULATION_NAMES = {
   nfe_swe: 'Swedish',
 } as const
 
-export type PopulationId = keyof typeof GNOMAD_POPULATION_NAMES
+export type AncestryGroupId = keyof typeof GNOMAD_ANCESTRY_GROUP_NAMES
+
+// Temporary definitions so we can use the new names in new code without having
+// to immediately update all uses of the old (deprecated) names.
+export type PopulationId = AncestryGroupId
+export const GNOMAD_POPULATION_NAMES = GNOMAD_ANCESTRY_GROUP_NAMES
 
 export type PopulationIdAndChromosome =
   | PopulationId

From d514db83689e76df381336e86d9f7f8355d170b4 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 22 Jul 2024 11:41:12 -0400
Subject: [PATCH 05/36] WIP that should be the allele size plot

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 82 ++++++-----------
 ...rtTandemRepeatGenotypeDistributionPlot.tsx | 88 +++++++------------
 .../ShortTandemRepeatPage.tsx                 | 42 +++++----
 .../ShortTandemRepeatPopulationOptions.tsx    |  8 +-
 .../shortTandemRepeatHelpers.ts               | 62 +++++++++----
 5 files changed, 138 insertions(+), 144 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 392583544..88ab31647 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -1,12 +1,12 @@
 import { max } from 'd3-array'
 import { scaleBand, scaleLinear, scaleLog } from 'd3-scale'
-import PropTypes from 'prop-types'
 import React, { useMemo } from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
 
 import { TooltipAnchor } from '@gnomad/ui'
+import { AlleleSizeDistributionItem, ScaleType } from './ShortTandemRepeatPage'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -24,7 +24,7 @@ const TooltipTrigger = styled.rect`
   }
 `
 
-const tickFormat = (n: any) => {
+const tickFormat = (n: number) => {
   if (n >= 1e9) {
     return `${(n / 1e9).toPrecision(3)}B`
   }
@@ -40,23 +40,28 @@ const tickFormat = (n: any) => {
 const labelProps = {
   fontSize: 14,
   textAnchor: 'middle',
+} as const
+
+type Range = { start: number; stop: number; label: string }
+
+type Props = {
+  maxRepeats: number
+  alleleSizeDistribution: AlleleSizeDistributionItem[]
+  repeatUnitLength: number
+  scaleType: ScaleType
+  ranges: Range[]
+  size: { width: number }
 }
 
 const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
   ({
-    // @ts-expect-error TS(2339) FIXME: Property 'maxRepeats' does not exist on type '{}'.
     maxRepeats,
-    // @ts-expect-error TS(2339) FIXME: Property 'alleleSizeDistribution' does not exist o... Remove this comment to see the full error message
     alleleSizeDistribution,
-    // @ts-expect-error TS(2339) FIXME: Property 'repeatUnitLength' does not exist on type... Remove this comment to see the full error message
     repeatUnitLength,
-    // @ts-expect-error TS(2339) FIXME: Property 'size' does not exist on type '{}'.
     size: { width },
-    // @ts-expect-error TS(2339) FIXME: Property 'scaleType' does not exist on type '{}'.
-    scaleType,
-    // @ts-expect-error TS(2339) FIXME: Property 'ranges' does not exist on type '{}'.
-    ranges,
-  }) => {
+    scaleType = 'linear',
+    ranges = [],
+  }: Props) => {
     const height = 300
 
     const margin = {
@@ -79,16 +84,15 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
         count: 0,
       }))
 
-      // @ts-expect-error TS(7031) FIXME: Binding element 'repeatCount' implicitly has an 'a... Remove this comment to see the full error message
-      alleleSizeDistribution.forEach(([repeatCount, nAlleles]) => {
-        const binIndex = Math.floor(repeatCount / binSize)
-        d[binIndex].count += nAlleles
+      alleleSizeDistribution.forEach(({ repunit_count, frequency }) => {
+        const binIndex = Math.floor(repunit_count / binSize)
+        d[binIndex].count += frequency
       })
 
       return d
     }, [alleleSizeDistribution, nBins, binSize])
 
-    const xScale = scaleBand()
+    const xScale = scaleBand<number>()
       .domain(data.map((d: any) => d.binIndex))
       .range([0, plotWidth])
 
@@ -117,8 +121,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
         const readLengthBinIndex = Math.floor(readLengthInRepeats / binSize)
         // Read length line should be drawn at the center of the range for its value.
         readLengthX =
-          // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-          xScale(readLengthBinIndex) +
+          (xScale(readLengthBinIndex) || 0) +
           ((readLengthInRepeats - readLengthBinIndex * binSize) / binSize) * xBandwidth +
           xBandwidth / binSize / 2
       }
@@ -130,14 +133,12 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
           <AxisBottom
             label="Repeats"
             labelOffset={binSize === 1 ? 10 : 30}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             scale={xScale}
             stroke="#333"
-            tickFormat={(binIndex) =>
-              // @ts-expect-error TS(7015) FIXME: Element implicitly has an 'any' type because index... Remove this comment to see the full error message
-              (binIndex as any) % labelInterval === 0 ? data[binIndex].label : ''
+            tickFormat={(binIndex: number) =>
+              binIndex % labelInterval === 0 ? data[binIndex].label : ''
             }
             tickLabelProps={
               binSize === 1
@@ -157,8 +158,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
                       fontSize: 10,
                       textAnchor: 'end',
                       transform: `translate(0, 0), rotate(-40 ${
-                        // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                        xScale(binIndex) + xBandwidth / 2
+                        (xScale(binIndex) || 0) + xBandwidth / 2
                       }, 0)`,
                     }
                   }
@@ -168,7 +168,6 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
           <AxisLeft
             label="Alleles"
             labelOffset={40}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             numTicks={scaleType === 'log' ? 10 : Math.min(10, yScale.domain()[1])}
@@ -176,9 +175,9 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
             stroke="#333"
             tickFormat={
               scaleType === 'log'
-                ? // @ts-expect-error TS(2345) FIXME: Argument of type 'unknown' is not assignable to pa... Remove this comment to see the full error message
-                  (n) => (Number.isInteger(Math.log10(n)) ? tickFormat(n) : '')
-                : tickFormat
+                ? (n: unknown) =>
+                    Number.isInteger(Math.log10(n as number)) ? tickFormat(n as number) : ''
+                : (n: unknown) => tickFormat(n as number)
             }
             tickLabelProps={() => ({
               dx: '-0.25em',
@@ -239,15 +238,13 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
               .map((range: any, rangeIndex: any) => {
                 const startBinIndex = Math.floor(range.start / binSize)
                 const startX =
-                  // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                  xScale(startBinIndex) +
+                  (xScale(startBinIndex) || 0) +
                   ((range.start - startBinIndex * binSize) / binSize) * xBandwidth
                 let stopX
                 if (range.stop <= maxRepeats) {
                   const stopBinIndex = Math.floor(range.stop / binSize)
                   stopX =
-                    // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                    xScale(stopBinIndex) +
+                    (xScale(stopBinIndex) || 0) +
                     ((range.stop - stopBinIndex * binSize) / binSize) * xBandwidth
                 } else {
                   stopX = plotWidth
@@ -350,25 +347,4 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
 ShortTandemRepeatAlleleSizeDistributionPlot.displayName =
   'ShortTandemRepeatAlleleSizeDistributionPlot'
 
-ShortTandemRepeatAlleleSizeDistributionPlot.propTypes = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ maxRepeats: PropTypes.Validator<number>; a... Remove this comment to see the full error message
-  maxRepeats: PropTypes.number.isRequired,
-  alleleSizeDistribution: PropTypes.arrayOf(PropTypes.arrayOf(PropTypes.number)).isRequired,
-  repeatUnitLength: PropTypes.number,
-  scaleType: PropTypes.oneOf(['linear', 'log']),
-  ranges: PropTypes.arrayOf(
-    PropTypes.shape({
-      start: PropTypes.number.isRequired,
-      stop: PropTypes.number.isRequired,
-      label: PropTypes.string.isRequired,
-    })
-  ),
-}
-
-ShortTandemRepeatAlleleSizeDistributionPlot.defaultProps = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ scaleType: string; ranges: never[]; }' is ... Remove this comment to see the full error message
-  scaleType: 'linear',
-  ranges: [],
-}
-
 export default ShortTandemRepeatAlleleSizeDistributionPlot
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
index 7ce7ef7d4..a6e170bf2 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
@@ -1,6 +1,5 @@
 import { max } from 'd3-array'
 import { scaleBand, scaleLog } from 'd3-scale'
-import PropTypes from 'prop-types'
 import React from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
@@ -19,25 +18,39 @@ const GraphWrapper = styled.div`
 const labelProps = {
   fontSize: 14,
   textAnchor: 'middle',
+} as const
+
+type PlotRange = { start: number; stop: number; label: string }
+
+type Props = {
+  axisLabels: string[]
+  maxRepeats: number[]
+  genotypeDistribution: never
+  xRanges: PlotRange[]
+  yRanges: PlotRange[]
+  onSelectBin: (bin: Bin) => void
+  size: { width: number }
+}
+
+export type Bin = {
+  label: string
+  xBinIndex: number
+  yBinIndex: number
+  xRange: number[]
+  yRange: number[]
+  count: number
 }
 
 const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
   ({
-    // @ts-expect-error TS(2339) FIXME: Property 'axisLabels' does not exist on type '{}'.
     axisLabels,
-    // @ts-expect-error TS(2339) FIXME: Property 'maxRepeats' does not exist on type '{}'.
     maxRepeats,
-    // @ts-expect-error TS(2339) FIXME: Property 'genotypeDistribution' does not exist on ... Remove this comment to see the full error message
     genotypeDistribution,
-    // @ts-expect-error TS(2339) FIXME: Property 'size' does not exist on type '{}'.
     size: { width },
-    // @ts-expect-error TS(2339) FIXME: Property 'xRanges' does not exist on type '{}'.
-    xRanges,
-    // @ts-expect-error TS(2339) FIXME: Property 'yRanges' does not exist on type '{}'.
-    yRanges,
-    // @ts-expect-error TS(2339) FIXME: Property 'onSelectBin' does not exist on type '{}'... Remove this comment to see the full error message
-    onSelectBin,
-  }) => {
+    xRanges = [],
+    yRanges = [],
+    onSelectBin = () => {},
+  }: Props) => {
     const height = Math.min(width, 500)
 
     const margin = {
@@ -78,7 +91,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
           ? `${yBinIndex}`
           : `${yBinIndex * yBinSize} - ${yBinIndex * yBinSize + yBinSize - 1}`
 
-      return {
+      const result: Bin = {
         label: `${xLabel} repeats in ${axisLabels[0]} / ${yLabel} repeats in ${axisLabels[1]}`,
         xBinIndex,
         yBinIndex,
@@ -86,23 +99,21 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
         yRange,
         count: 0,
       }
+      return result
     })
 
-    // @ts-expect-error TS(7031) FIXME: Binding element 'repeats1' implicitly has an 'any'... Remove this comment to see the full error message
     genotypeDistribution.forEach(([repeats1, repeats2, nAlleles]) => {
       const xBinIndex = Math.floor(repeats1 / xBinSize)
       const yBinIndex = Math.floor(repeats2 / yBinSize)
       data[xBinIndex * yNumBins + yBinIndex].count += nAlleles
     })
 
-    const xScale = scaleBand()
-      // @ts-expect-error TS(2345) FIXME: Argument of type 'number[]' is not assignable to p... Remove this comment to see the full error message
+    const xScale = scaleBand<number>()
       .domain(Array.from(Array(xNumBins).keys()))
       .range([0, plotWidth])
     const xBandwidth = xScale.bandwidth()
 
-    const yScale = scaleBand()
-      // @ts-expect-error TS(2345) FIXME: Argument of type 'number[]' is not assignable to p... Remove this comment to see the full error message
+    const yScale = scaleBand<number>()
       .domain(Array.from(Array(yNumBins).keys()))
       .range([plotHeight, 0])
     const yBandwidth = yScale.bandwidth()
@@ -131,7 +142,6 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     }
 
     const opacityScale = scaleLog()
-      // @ts-expect-error TS(2345) FIXME: Argument of type '(string | number | undefined)[]'... Remove this comment to see the full error message
       .domain([1, max(genotypeDistribution, (d: any) => d[2])])
       .range([0.1, 1])
 
@@ -141,7 +151,6 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
           <AxisBottom
             label={`Repeats in ${axisLabels[0]}`}
             labelOffset={xBinSize === 1 ? 10 : 30}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             scale={xScale}
@@ -165,8 +174,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
                       fontSize: 10,
                       textAnchor: 'end',
                       transform: `translate(0, 0), rotate(-40 ${
-                        // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                        xScale(binIndex) + xBandwidth / 2
+                        (xScale(binIndex) || 0) + xBandwidth / 2
                       }, 0)`,
                     }
                   }
@@ -176,7 +184,6 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
           <AxisLeft
             label={`Repeats in ${axisLabels[1]}`}
             labelOffset={60}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             scale={yScale}
@@ -235,16 +242,14 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
               .map((range: any, rangeIndex: any, ranges: any) => {
                 const startBinIndex = Math.floor(range.start / xBinSize)
                 const startX =
-                  // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                  xScale(startBinIndex) +
+                  (xScale(startBinIndex) || 0) +
                   ((range.start - startBinIndex * xBinSize) / xBinSize) * xBandwidth
 
                 let stopX
                 if (range.stop <= maxRepeats[0]) {
                   const stopBinIndex = Math.floor(range.stop / xBinSize)
                   stopX =
-                    // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                    xScale(stopBinIndex) +
+                    (xScale(stopBinIndex) || 0) +
                     ((range.stop - stopBinIndex * xBinSize) / xBinSize) * xBandwidth
                 } else {
                   stopX = plotWidth
@@ -324,16 +329,14 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
               .map((range: any, rangeIndex: any, ranges: any) => {
                 const startBinIndex = Math.floor(range.start / yBinSize)
                 const startY =
-                  // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                  yScale(startBinIndex) +
+                  (yScale(startBinIndex) || 0) +
                   (1 - (range.start - startBinIndex * yBinSize) / yBinSize) * yBandwidth
 
                 let stopY
                 if (range.stop <= maxRepeats[1]) {
                   const stopBinIndex = Math.floor(range.stop / yBinSize)
                   stopY =
-                    // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                    yScale(stopBinIndex) +
+                    (yScale(stopBinIndex) || 0) +
                     (1 - (range.stop - stopBinIndex * yBinSize) / yBinSize) * yBandwidth
                 } else {
                   stopY = 0
@@ -403,30 +406,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
 
 ShortTandemRepeatGenotypeDistributionPlot.displayName = 'ShortTandemRepeatGenotypeDistributionPlot'
 
-ShortTandemRepeatGenotypeDistributionPlot.propTypes = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ axisLabels: PropTypes.Validator<(string | ... Remove this comment to see the full error message
-  axisLabels: PropTypes.arrayOf(PropTypes.string).isRequired,
-  maxRepeats: PropTypes.arrayOf(PropTypes.number).isRequired,
-  genotypeDistribution: PropTypes.arrayOf(PropTypes.arrayOf(PropTypes.number)).isRequired,
-  xRanges: PropTypes.arrayOf(
-    PropTypes.shape({
-      start: PropTypes.number.isRequired,
-      stop: PropTypes.number.isRequired,
-      label: PropTypes.string.isRequired,
-    })
-  ),
-  yRanges: PropTypes.arrayOf(
-    PropTypes.shape({
-      start: PropTypes.number.isRequired,
-      stop: PropTypes.number.isRequired,
-      label: PropTypes.string.isRequired,
-    })
-  ),
-  onSelectBin: PropTypes.func,
-}
-
 ShortTandemRepeatGenotypeDistributionPlot.defaultProps = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ xRanges: never[]; yRanges: never[]; onSele... Remove this comment to see the full error message
   xRanges: [],
   yRanges: [],
   onSelectBin: () => {},
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 7b4d7edda..e2ad9d95c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -15,7 +15,9 @@ import ShortTandemRepeatAssociatedDiseasesTable from './ShortTandemRepeatAssocia
 import ShortTandemRepeatAttributes from './ShortTandemRepeatAttributes'
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
 import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
-import ShortTandemRepeatGenotypeDistributionPlot from './ShortTandemRepeatGenotypeDistributionPlot'
+import ShortTandemRepeatGenotypeDistributionPlot, {
+  Bin as GenotypeBin,
+} from './ShortTandemRepeatGenotypeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionBinDetails from './ShortTandemRepeatGenotypeDistributionBinDetails'
 import ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect from './ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect'
 import ShortTandemRepeatReads from './ShortTandemRepeatReads'
@@ -33,14 +35,14 @@ type ShortTandemRepeatReferenceRegion = {
   stop: number
 }
 
-type AlleleSizeDistributionItem = {
+export type AlleleSizeDistributionItem = {
   repunit_count: number
   frequency: number
 }
 
-export type Sex = '' | 'XX' | 'XY'
+export type Sex = 'XX' | 'XY'
 
-type AlleleSizeDistributionCohort = {
+export type AlleleSizeDistributionCohort = {
   ancestry_group: AncestryGroupId
   sex: Sex
   repunit: string
@@ -141,7 +143,7 @@ type ShortTandemRepeatPageProps = {
   shortTandemRepeat: ShortTandemRepeat
 }
 
-type ScaleType = 'linear' | 'log'
+export type ScaleType = 'linear' | 'log'
 
 const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
   const { allele_size_distribution, genotype_distribution } = shortTandemRepeat
@@ -159,8 +161,8 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     genotypeDistributionRepunitPairs.length === 1 ? genotypeDistributionRepunitPairs[0] : ''
   const defaultDisease = shortTandemRepeat.associated_diseases[0].name
 
-  const [selectedAncestryGroup, setSelectedAncestryGroup] = useState<string>('')
-  const [selectedSex, setSelectedSex] = useState<Sex>('')
+  const [selectedAncestryGroup, setSelectedAncestryGroup] = useState<AncestryGroupId | ''>('')
+  const [selectedSex, setSelectedSex] = useState<Sex | ''>('')
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
@@ -224,7 +226,8 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     }
   })
 
-  const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] = useState(null)
+  const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] =
+    useState<GenotypeBin | null>(null)
 
   return (
     <>
@@ -274,10 +277,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Allele Size Distribution <InfoButton topic="str-allele-size-distribution" />
         </h2>
         <ShortTandemRepeatAlleleSizeDistributionPlot
-          // @ts-expect-error TS(2322) FIXME: Type '{ maxRepeats: number; alleleSizeDistribution... Remove this comment to see the full error message
           maxRepeats={maxAlleleSizeDistributionRepeats}
           alleleSizeDistribution={getSelectedAlleleSizeDistribution(shortTandemRepeat, {
             selectedAncestryGroup,
+            selectedSex,
             selectedRepeatUnit: selectedAlleleSizeRepeatUnit,
           })}
           repeatUnitLength={
@@ -478,7 +481,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
               ? plotRanges
               : []
           }
-          onSelectBin={(bin: any) => {
+          onSelectBin={(bin: GenotypeBin) => {
             if (bin.xRange[0] !== bin.xRange[1] || bin.yRange[0] !== bin.yRange[1]) {
               setSelectedGenotypeDistributionBin(bin)
             }
@@ -487,11 +490,12 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ControlSection style={{ marginTop: '0.5em' }}>
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-genotype-distribution`}
-            populationIds={populationIds}
-            selectedPopulationId={selectedAncestryGroup}
-            onSelectPopulationId={setSelectedAncestryGroup}
+            ancestryGroups={ancestryGroups}
+            selectedAncestryGroup={selectedAncestryGroup}
+            selectedSex={selectedSex}
+            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedSex={setSelectedSex}
           />
-
           <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
             value={selectedGenotypeDistributionRepeatUnits}
@@ -619,10 +623,12 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         </h2>
         <ControlSection style={{ marginBottom: '1em' }}>
           <ShortTandemRepeatPopulationOptions
-            id={`${shortTandemRepeat.id}-read-data`}
-            populationIds={populationIds}
-            selectedPopulationId={selectedAncestryGroup}
-            onSelectPopulationId={setSelectedAncestryGroup}
+            id={`${shortTandemRepeat.id}-genotype-distribution`}
+            ancestryGroups={ancestryGroups}
+            selectedAncestryGroup={selectedAncestryGroup}
+            selectedSex={selectedSex}
+            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedSex={setSelectedSex}
           />
         </ControlSection>
         <ShortTandemRepeatReads
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index b8f041dbe..94810daae 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -25,10 +25,10 @@ const Wrapper = styled.div`
 type Props = {
   id: string
   ancestryGroups: AncestryGroupId[]
-  selectedAncestryGroup: AncestryGroupId
-  selectedSex: string
-  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId>>
-  setSelectedSex: Dispatch<SetStateAction<Sex>>
+  selectedAncestryGroup: AncestryGroupId | ''
+  selectedSex: Sex | ''
+  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId | ''>>
+  setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
 }
 
 const ShortTandemRepeatPopulationOptions = ({
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 02e4e5e2f..53024293e 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -1,25 +1,57 @@
-const sumDistributions = (distributions: any) => {
-  const nByKey = distributions.flat().reduce((acc: any, d: any) => {
-    const key = d.slice(0, d.length - 1).join('/')
-    return {
-      ...acc,
-      [key]: (acc[key] || 0) + d[d.length - 1],
-    }
-  }, {})
-  return Object.entries(nByKey).map(([key, n]) => [...key.split('/').map(Number), n])
+import {
+  Sex,
+  ShortTandemRepeat,
+  AlleleSizeDistributionItem,
+  AlleleSizeDistributionCohort,
+} from './ShortTandemRepeatPage'
+import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+
+type AlleleSizeDistributionFilters = {
+  selectedAncestryGroup: AncestryGroupId | ''
+  selectedSex: Sex | ''
+  selectedRepeatUnit: string
 }
 
+const addCohortToDistribution = (
+  cohort: AlleleSizeDistributionCohort,
+  distribution: Record<number, AlleleSizeDistributionItem>
+): Record<number, AlleleSizeDistributionItem> =>
+  cohort.distribution.reduce((acc, distributionItem) => {
+    const { repunit_count } = distributionItem
+    const existingItem = acc[repunit_count]
+    const countSoFar = existingItem ? existingItem.frequency : 0
+    const newItem: AlleleSizeDistributionItem = {
+      repunit_count: repunit_count,
+      frequency: countSoFar + distributionItem.frequency,
+    }
+    return { ...acc, [repunit_count]: newItem }
+  }, distribution)
+
 export const getSelectedAlleleSizeDistribution = (
-  shortTandemRepeatOrAdjacentRepeat: any,
-  { selectedRepeatUnit, selectedPopulationId }: any
-) => {
-  if (selectedRepeatUnit) {
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat,
+  { selectedAncestryGroup, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
+): AlleleSizeDistributionItem[] => {
+  const itemsByRepunitCount: Record<number, AlleleSizeDistributionItem> =
+    shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.reduce((acc, cohort) => {
+      if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {
+        return acc
+      }
+      if (selectedSex !== '' && cohort.sex !== selectedSex) {
+        return acc
+      }
+      if (cohort.repunit !== selectedRepeatUnit) {
+        return acc
+      }
+      return addCohortToDistribution(cohort, acc)
+    }, {} as Record<number, AlleleSizeDistributionItem>)
+  return Object.values(itemsByRepunitCount)
+}
+/*  if (selectedRepeatUnit) {
     // Repeat units grouped by classification are not valid for adjacent repeats.
     if (selectedRepeatUnit.startsWith('classification')) {
       const selectedClassification = selectedRepeatUnit.slice(15)
 
       const repeatUnitClassification = shortTandemRepeatOrAdjacentRepeat.repeat_units.reduce(
-        // @ts-expect-error TS(7006) FIXME: Parameter 'acc' implicitly has an 'any' type.
         (acc, repeatUnit) => ({
           ...acc,
           [repeatUnit.repeat_unit]: repeatUnit.classification,
@@ -58,7 +90,7 @@ export const getSelectedAlleleSizeDistribution = (
   }
 
   return shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.distribution
-}
+}*/
 
 export const getSelectedGenotypeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: any,

From 2ab384323f2a3bdba3c562c9abfba088485f835d Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 22 Jul 2024 16:14:47 -0400
Subject: [PATCH 06/36] WIP genotype select

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx |  2 +-
 ...rtTandemRepeatGenotypeDistributionPlot.tsx | 41 +++++-----
 ...tGenotypeDistributionRepeatUnitsSelect.tsx | 81 ++++++++-----------
 .../ShortTandemRepeatPage.tsx                 | 51 +++++-------
 .../shortTandemRepeatHelpers.ts               |  1 +
 5 files changed, 76 insertions(+), 100 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 88ab31647..a1d0819a4 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -47,7 +47,7 @@ type Range = { start: number; stop: number; label: string }
 type Props = {
   maxRepeats: number
   alleleSizeDistribution: AlleleSizeDistributionItem[]
-  repeatUnitLength: number
+  repeatUnitLength: number | null
   scaleType: ScaleType
   ranges: Range[]
   size: { width: number }
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
index a6e170bf2..cf4269fd6 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
@@ -6,6 +6,7 @@ import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
 
 import { TooltipAnchor } from '@gnomad/ui'
+import { GenotypeDistributionItem } from './ShortTandemRepeatPage'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -24,8 +25,8 @@ type PlotRange = { start: number; stop: number; label: string }
 
 type Props = {
   axisLabels: string[]
-  maxRepeats: number[]
-  genotypeDistribution: never
+  maxRepeats: [number, number]
+  genotypeDistribution: GenotypeDistributionItem[]
   xRanges: PlotRange[]
   yRanges: PlotRange[]
   onSelectBin: (bin: Bin) => void
@@ -69,7 +70,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     const yBinSize = Math.max(1, Math.ceil(maxRepeats[1] / (plotHeight / 10)))
     const yNumBins = Math.floor(maxRepeats[1] / yBinSize) + 1
 
-    const data = Array.from(Array(xNumBins * yNumBins).keys()).map((n: any) => {
+    const data = Array.from(Array(xNumBins * yNumBins).keys()).map((n) => {
       const xBinIndex = Math.floor(n / yNumBins)
       const yBinIndex = n % yNumBins
 
@@ -102,11 +103,13 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
       return result
     })
 
-    genotypeDistribution.forEach(([repeats1, repeats2, nAlleles]) => {
-      const xBinIndex = Math.floor(repeats1 / xBinSize)
-      const yBinIndex = Math.floor(repeats2 / yBinSize)
-      data[xBinIndex * yNumBins + yBinIndex].count += nAlleles
-    })
+    genotypeDistribution.forEach(
+      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => {
+        const xBinIndex = Math.floor(short_allele_repunit_count / xBinSize)
+        const yBinIndex = Math.floor(long_allele_repunit_count / yBinSize)
+        data[xBinIndex * yNumBins + yBinIndex].count += frequency
+      }
+    )
 
     const xScale = scaleBand<number>()
       .domain(Array.from(Array(xNumBins).keys()))
@@ -121,7 +124,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     const xMaxNumLabels = Math.floor(plotWidth / 20)
     const xLabelInterval = Math.max(Math.round(xNumBins / xMaxNumLabels), 1)
 
-    const xTickFormat = (binIndex: any) => {
+    const xTickFormat = (binIndex: number) => {
       if (binIndex % xLabelInterval !== 0) {
         return ''
       }
@@ -133,7 +136,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
       return `${binIndex * xBinSize} - ${binIndex * xBinSize + xBinSize - 1}`
     }
 
-    const yTickFormat = (binIndex: any) => {
+    const yTickFormat = (binIndex: number) => {
       if (yBinSize === 1) {
         return `${binIndex}`
       }
@@ -142,7 +145,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     }
 
     const opacityScale = scaleLog()
-      .domain([1, max(genotypeDistribution, (d: any) => d[2])])
+      .domain([1, max(genotypeDistribution, (d) => d.frequency) || 2])
       .range([0.1, 1])
 
     return (
@@ -201,8 +204,8 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left},${margin.top})`}>
             {data
-              .filter((d: any) => d.count !== 0)
-              .map((d: any) => {
+              .filter((d) => d.count !== 0)
+              .map((d) => {
                 return (
                   <React.Fragment key={`${d.xBinIndex}-${d.yBinIndex}`}>
                     <TooltipAnchor
@@ -237,9 +240,9 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left}, 0)`}>
             {xRanges
-              .filter((range: any) => range.start !== range.stop)
-              .filter((range: any) => range.start <= maxRepeats[0])
-              .map((range: any, rangeIndex: any, ranges: any) => {
+              .filter((range) => range.start !== range.stop)
+              .filter((range) => range.start <= maxRepeats[0])
+              .map((range, rangeIndex, ranges) => {
                 const startBinIndex = Math.floor(range.start / xBinSize)
                 const startX =
                   (xScale(startBinIndex) || 0) +
@@ -324,9 +327,9 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left}, ${margin.top})`}>
             {yRanges
-              .filter((range: any) => range.start !== range.stop)
-              .filter((range: any) => range.start <= maxRepeats[1])
-              .map((range: any, rangeIndex: any, ranges: any) => {
+              .filter((range) => range.start !== range.stop)
+              .filter((range) => range.start <= maxRepeats[1])
+              .map((range, rangeIndex, ranges) => {
                 const startBinIndex = Math.floor(range.start / yBinSize)
                 const startY =
                   (yScale(startBinIndex) || 0) +
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
index 381f96e90..00bf12cbe 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
@@ -1,31 +1,24 @@
-import React from 'react'
+import React, { Dispatch, SetStateAction } from 'react'
 
 import { Select } from '@gnomad/ui'
+import { ShortTandemRepeat } from './ShortTandemRepeatPage'
 
 type Props = {
-  shortTandemRepeatOrAdjacentRepeat: {
-    id: string
-    associated_diseases?: any[]
-    reference_repeat_unit: string
-    genotype_distribution: {
-      repeat_units: {
-        repeat_units?: string[]
-      }[]
-    }
-    repeat_units: any[]
-  }
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat
+  repunitPairs: string[]
   value: string
-  onChange: (...args: any[]) => any
+  onChange: Dispatch<SetStateAction<string>>
 }
 
 const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
   shortTandemRepeatOrAdjacentRepeat,
   value,
+  repunitPairs,
   onChange,
 }: Props) => {
   // Adjacent repeats do not have classifications for repeat units.
   const isAdjacentRepeat = !shortTandemRepeatOrAdjacentRepeat.associated_diseases
-  const repeatUnitClassifications = isAdjacentRepeat
+  const repeatUnitClassifications: Record<string, string> = isAdjacentRepeat
     ? {}
     : shortTandemRepeatOrAdjacentRepeat.repeat_units.reduce(
         (acc, repeatUnit) => ({ ...acc, [repeatUnit.repeat_unit]: repeatUnit.classification }),
@@ -40,44 +33,38 @@ const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
       <Select
         id={`short-tandem-repeat-${shortTandemRepeatOrAdjacentRepeat.id}-genotype-distribution-repeat-units`}
         value={value}
-        onChange={(e: any) => {
+        onChange={(e: { target: { value: string } }) => {
           onChange(e.target.value)
         }}
       >
-        {shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units.length > 1 && (
-          <option value="">All</option>
-        )}
+        {repunitPairs.length > 1 && <option value="">All</option>}
         <optgroup label="Repeat unit pairs (only pairs found in gnomAD are listed here)">
-          {shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units.map(
-            (repeatUnitDistribution) => {
-              // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-              const optionValue = repeatUnitDistribution.repeat_units.join(' / ')
-              return (
-                <option key={optionValue} value={optionValue}>
-                  {/* @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'. */}
-                  {repeatUnitDistribution.repeat_units
-                    .map((repeatUnit) => {
-                      const notes = []
-                      if (repeatUnitClassifications[repeatUnit]) {
-                        notes.push(repeatUnitClassifications[repeatUnit])
-                      }
-                      if (repeatUnit === shortTandemRepeatOrAdjacentRepeat.reference_repeat_unit) {
-                        notes.push('reference')
-                      }
+          {repunitPairs.map((pair) => {
+            return (
+              <option key={pair} value={pair}>
+                {pair
+                  .split(' / ')
+                  .map((repeatUnit) => {
+                    const notes = []
+                    if (repeatUnitClassifications[repeatUnit]) {
+                      notes.push(repeatUnitClassifications[repeatUnit])
+                    }
+                    if (repeatUnit === shortTandemRepeatOrAdjacentRepeat.reference_repeat_unit) {
+                      notes.push('reference')
+                    }
 
-                      if (
-                        shortTandemRepeatOrAdjacentRepeat.repeat_units.length > 1 &&
-                        notes.length > 0
-                      ) {
-                        return `${repeatUnit} (${notes.join(', ')})`
-                      }
-                      return repeatUnit
-                    })
-                    .join(' / ')}
-                </option>
-              )
-            }
-          )}
+                    if (
+                      shortTandemRepeatOrAdjacentRepeat.repeat_units.length > 1 &&
+                      notes.length > 0
+                    ) {
+                      return `${repeatUnit} (${notes.join(', ')})`
+                    }
+                    return repeatUnit
+                  })
+                  .join(' / ')}
+              </option>
+            )
+          })}
         </optgroup>
       </Select>
     </label>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index e2ad9d95c..929f4c81c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -1,4 +1,3 @@
-import { max, min } from 'd3-array'
 import React, { useState } from 'react'
 import styled from 'styled-components'
 
@@ -51,7 +50,7 @@ export type AlleleSizeDistributionCohort = {
   distribution: AlleleSizeDistributionItem[]
 }
 
-type GenotypeDistributionItem = {
+export type GenotypeDistributionItem = {
   short_allele_repunit_count: number
   long_allele_repunit_count: number
   frequency: number
@@ -123,21 +122,6 @@ const FlexWrapper = styled.div`
   width: 100%;
 `
 
-const parseCombinedPopulationId = (combinedPopulationId: any) => {
-  let population
-  let sex
-  if (combinedPopulationId.includes('_')) {
-    ;[population, sex] = combinedPopulationId.split('_')
-  } else if (combinedPopulationId === 'XX' || combinedPopulationId === 'XY') {
-    population = null
-    sex = combinedPopulationId
-  } else {
-    population = combinedPopulationId
-    sex = null
-  }
-  return { population, sex }
-}
-
 type ShortTandemRepeatPageProps = {
   datasetId: DatasetId
   shortTandemRepeat: ShortTandemRepeat
@@ -148,12 +132,16 @@ export type ScaleType = 'linear' | 'log'
 const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
   const { allele_size_distribution, genotype_distribution } = shortTandemRepeat
 
-  const alleleSizeDistributionRepunits = allele_size_distribution
-    .map((cohort) => cohort.repunit)
-    .sort()
-  const genotypeDistributionRepunitPairs = genotype_distribution
-    .map((cohort) => [cohort.short_allele_repunit, cohort.long_allele_repunit].join(', '))
-    .sort()
+  const alleleSizeDistributionRepunits = [
+    ...new Set(allele_size_distribution.map((cohort) => cohort.repunit)),
+  ].sort()
+  const genotypeDistributionRepunitPairs = [
+    ...new Set(
+      genotype_distribution.map((cohort) =>
+        [cohort.short_allele_repunit, cohort.long_allele_repunit].join(' / ')
+      )
+    ),
+  ].sort()
 
   const defaultAlleleSizeRepunit =
     alleleSizeDistributionRepunits.length === 1 ? alleleSizeDistributionRepunits[0] : ''
@@ -166,7 +154,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
-    useState<string>(defaultGenotypeDistributionRepunits)
+    useState<string | ''>(defaultGenotypeDistributionRepunits)
   const [selectedDisease, setSelectedDisease] = useState<string>(defaultDisease)
   const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
   const [showAdjacentRepeats, setShowAdjacentRepeats] = useState<boolean>(false)
@@ -181,6 +169,9 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     )
   )
 
+  const maxGenotypeDistributionShortAlleleRepeats = 0 // TK
+  const maxGenotypeDistributionLongAlleleRepeats = 0 // TK
+
   const allRepeatUnitsByClassification: Record<string, string[]> = {}
   shortTandemRepeat.repeat_units.forEach((repeatUnit) => {
     if (allRepeatUnitsByClassification[repeatUnit.classification] === undefined) {
@@ -447,17 +438,12 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Genotype Distribution <InfoButton topic="str-genotype-distribution" />
         </h2>
         <ShortTandemRepeatGenotypeDistributionPlot
-          // @ts-expect-error TS(2322) FIXME: Type '{ axisLabels: any; maxRepeats: (string | und... Remove this comment to see the full error message
           axisLabels={getGenotypeDistributionPlotAxisLabels(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
           })}
           maxRepeats={[
-            max(shortTandemRepeat.genotype_distribution.distribution, (d: any) =>
-              max(d.slice(0, 2))
-            ),
-            max(shortTandemRepeat.genotype_distribution.distribution, (d: any) =>
-              min(d.slice(0, 2))
-            ),
+            maxGenotypeDistributionLongAlleleRepeats,
+            maxGenotypeDistributionShortAlleleRepeats,
           ]}
           genotypeDistribution={getSelectedGenotypeDistribution(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
@@ -498,6 +484,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           />
           <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
+            repunitPairs={genotypeDistributionRepunitPairs}
             value={selectedGenotypeDistributionRepeatUnits}
             onChange={setSelectedGenotypeDistributionRepeatUnits}
           />
@@ -566,7 +553,6 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Age Distribution <InfoButton topic="str-age-distribution" />
         </h2>
         <ShortTandemRepeatAgeDistributionPlot
-          // @ts-expect-error TS(2322) FIXME: Type '{ ageDistribution: any; maxRepeats: number; ... Remove this comment to see the full error message
           ageDistribution={(shortTandemRepeat as any).age_distribution}
           maxRepeats={maxAlleleSizeDistributionRepeats}
           ranges={allRepeatUnitsFoundInGnomadArePathogenic ? plotRanges : []}
@@ -589,7 +575,6 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                 <ShortTandemRepeatAdjacentRepeatSection
                   key={adjacentRepeat.id}
                   adjacentRepeat={adjacentRepeat}
-                  populationIds={populationIds}
                   selectedPopulationId={selectedAncestryGroup}
                   onSelectPopulationId={setSelectedAncestryGroup}
                   selectedScaleType={selectedScaleType}
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 53024293e..b13d0b50f 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -31,6 +31,7 @@ export const getSelectedAlleleSizeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat,
   { selectedAncestryGroup, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
 ): AlleleSizeDistributionItem[] => {
+  // TK figure out what's up with classification
   const itemsByRepunitCount: Record<number, AlleleSizeDistributionItem> =
     shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.reduce((acc, cohort) => {
       if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {

From 798e8f4237c86fa360fcea364f1ffefc3c0c245a Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 22 Jul 2024 16:34:14 -0400
Subject: [PATCH 07/36] WIP age distribution

---
 .../ShortTandemRepeatAgeDistributionPlot.tsx  | 71 ++++++-------------
 .../ShortTandemRepeatPage.tsx                 | 16 ++++-
 2 files changed, 35 insertions(+), 52 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
index 8fa875668..f93abbac4 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
@@ -1,12 +1,12 @@
 import { max } from 'd3-array'
 import { scaleBand, scaleLog } from 'd3-scale'
-import PropTypes from 'prop-types'
 import React from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
 
 import { TooltipAnchor } from '@gnomad/ui'
+import { PlotRange, AgeDistributionItem } from './ShortTandemRepeatPage'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -19,9 +19,9 @@ const GraphWrapper = styled.div`
 const labelProps = {
   fontSize: 14,
   textAnchor: 'middle',
-}
+} as const
 
-const ageRangeLabel = (ageRange: any) => {
+const ageRangeLabel = (ageRange: [number | null, number | null]) => {
   const [minAge, maxAge] = ageRange
 
   if (minAge === null) {
@@ -33,9 +33,15 @@ const ageRangeLabel = (ageRange: any) => {
   return `${minAge}-${maxAge}`
 }
 
+type Props = {
+  ageDistribution: AgeDistributionItem[]
+  maxRepeats: number
+  ranges: PlotRange[]
+  size: { width: number }
+}
+
 const ShortTandemRepeatAgeDistributionPlot = withSize()(
-  // @ts-expect-error TS(2339) FIXME: Property 'ageDistribution' does not exist on type ... Remove this comment to see the full error message
-  ({ ageDistribution, maxRepeats, ranges, size: { width } }) => {
+  ({ ageDistribution, maxRepeats, ranges = [], size: { width } }: Props) => {
     const height = Math.min(width, 300)
 
     const margin = {
@@ -76,22 +82,19 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
       }
     })
 
-    ageDistribution.forEach((ageBin: any, yBinIndex: any) => {
-      // @ts-expect-error TS(7031) FIXME: Binding element 'repeats' implicitly has an 'any' ... Remove this comment to see the full error message
+    ageDistribution.forEach((ageBin, yBinIndex) => {
       ageBin.distribution.forEach(([repeats, nAlleles]) => {
         const xBinIndex = Math.floor(repeats / xBinSize)
         data[xBinIndex * yNumBins + yBinIndex].count += nAlleles
       })
     })
 
-    const xScale = scaleBand()
-      // @ts-expect-error TS(2345) FIXME: Argument of type 'number[]' is not assignable to p... Remove this comment to see the full error message
+    const xScale = scaleBand<number>()
       .domain(Array.from(Array(xNumBins).keys()))
       .range([0, plotWidth])
     const xBandwidth = xScale.bandwidth()
 
-    const yScale = scaleBand()
-      // @ts-expect-error TS(2345) FIXME: Argument of type 'number[]' is not assignable to p... Remove this comment to see the full error message
+    const yScale = scaleBand<number>()
       .domain(Array.from(Array(yNumBins).keys()))
       .range([plotHeight, 0])
     const yBandwidth = yScale.bandwidth()
@@ -116,11 +119,7 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
     }
 
     const opacityScale = scaleLog()
-      // @ts-expect-error TS(2345) FIXME: Argument of type '(string | number | undefined)[]'... Remove this comment to see the full error message
-      .domain([
-        1,
-        max(ageDistribution, (ageBin: any) => max(ageBin.distribution, (d: any) => d[1])),
-      ])
+      .domain([1, max(ageDistribution, (ageBin) => max(ageBin.distribution, (d: any) => d[1]))])
       .range([0.1, 1])
 
     return (
@@ -129,7 +128,6 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
           <AxisBottom
             label="Repeats"
             labelOffset={xBinSize === 1 ? 10 : 30}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             scale={xScale}
@@ -153,8 +151,7 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
                       fontSize: 10,
                       textAnchor: 'end',
                       transform: `translate(0, 0), rotate(-40 ${
-                        // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                        xScale(binIndex) + xBandwidth / 2
+                        (xScale(binIndex) || 0) + xBandwidth / 2
                       }, 0)`,
                     }
                   }
@@ -164,7 +161,6 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
           <AxisLeft
             label="Age"
             labelOffset={42}
-            // @ts-expect-error TS(2322) FIXME: Type '{ fontSize: number; textAnchor: string; }' i... Remove this comment to see the full error message
             labelProps={labelProps}
             left={margin.left}
             scale={yScale}
@@ -212,21 +208,19 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left}, 0)`}>
             {ranges
-              .filter((range: any) => range.start !== range.stop)
-              .filter((range: any) => range.start <= maxRepeats)
-              .map((range: any, rangeIndex: any) => {
+              .filter((range) => range.start !== range.stop)
+              .filter((range) => range.start <= maxRepeats)
+              .map((range, rangeIndex) => {
                 const startBinIndex = Math.floor(range.start / xBinSize)
                 const startX =
-                  // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                  xScale(startBinIndex) +
+                  (xScale(startBinIndex) || 0) +
                   ((range.start - startBinIndex * xBinSize) / xBinSize) * xBandwidth
 
                 let stopX
                 if (range.stop <= maxRepeats) {
                   const stopBinIndex = Math.floor(range.stop / xBinSize)
                   stopX =
-                    // @ts-expect-error TS(2532) FIXME: Object is possibly 'undefined'.
-                    xScale(stopBinIndex) +
+                    (xScale(stopBinIndex) || 0) +
                     ((range.stop - stopBinIndex * xBinSize) / xBinSize) * xBandwidth
                 } else {
                   stopX = plotWidth
@@ -306,27 +300,4 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
 
 ShortTandemRepeatAgeDistributionPlot.displayName = 'ShortTandemRepeatAgeDistributionPlot'
 
-ShortTandemRepeatAgeDistributionPlot.propTypes = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ ageDistribution: PropTypes.Requireable<(Pr... Remove this comment to see the full error message
-  ageDistribution: PropTypes.arrayOf(
-    PropTypes.shape({
-      age_range: PropTypes.arrayOf(PropTypes.number).isRequired,
-      distribution: PropTypes.arrayOf(PropTypes.arrayOf(PropTypes.number)).isRequired,
-    })
-  ),
-  maxRepeats: PropTypes.number.isRequired,
-  ranges: PropTypes.arrayOf(
-    PropTypes.shape({
-      start: PropTypes.number.isRequired,
-      stop: PropTypes.number.isRequired,
-      label: PropTypes.string.isRequired,
-    })
-  ),
-}
-
-ShortTandemRepeatAgeDistributionPlot.defaultProps = {
-  // @ts-expect-error TS(2322) FIXME: Type '{ ranges: never[]; }' is not assignable to t... Remove this comment to see the full error message
-  ranges: [],
-}
-
 export default ShortTandemRepeatAgeDistributionPlot
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 929f4c81c..561c4de89 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -66,6 +66,11 @@ type GenotypeDistributionCohort = {
   distribution: GenotypeDistributionItem[]
 }
 
+export type AgeDistributionItem = {
+  age_range: [number | null, number | null]
+  distribution: number[][]
+}
+
 export type ShortTandemRepeatAdjacentRepeat = {
   id: string
   reference_region: ShortTandemRepeatReferenceRegion
@@ -75,6 +80,12 @@ export type ShortTandemRepeatAdjacentRepeat = {
   genotype_distribution: GenotypeDistributionCohort[]
 }
 
+export type PlotRange = {
+  label: string
+  start: number
+  stop: number
+}
+
 export type ShortTandemRepeat = {
   id: string
   gene: {
@@ -104,6 +115,7 @@ export type ShortTandemRepeat = {
   }[]
   allele_size_distribution: AlleleSizeDistributionCohort[]
   genotype_distribution: GenotypeDistributionCohort[]
+  age_distribution: AgeDistributionItem[]
   adjacent_repeats: ShortTandemRepeatAdjacentRepeat[]
 }
 
@@ -209,7 +221,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     ? diseaseToPlot.repeat_size_classifications
     : []
 
-  const plotRanges = repeatSizeClassificationsToPlot.map((classification) => {
+  const plotRanges: PlotRange[] = repeatSizeClassificationsToPlot.map((classification) => {
     return {
       label: classification.classification,
       start: classification.min !== null ? classification.min : 0,
@@ -553,7 +565,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Age Distribution <InfoButton topic="str-age-distribution" />
         </h2>
         <ShortTandemRepeatAgeDistributionPlot
-          ageDistribution={(shortTandemRepeat as any).age_distribution}
+          ageDistribution={shortTandemRepeat.age_distribution}
           maxRepeats={maxAlleleSizeDistributionRepeats}
           ranges={allRepeatUnitsFoundInGnomadArePathogenic ? plotRanges : []}
         />

From 83ae794e811c5080850136791b5dbca90424db3e Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Wed, 24 Jul 2024 17:23:42 -0400
Subject: [PATCH 08/36] WIP more refactoring

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx |  76 +++++------
 ...TandemRepeatAlleleSizeDistributionPlot.tsx |   2 +-
 ...emRepeatGenotypeDistributionBinDetails.tsx |  24 ++--
 ...tGenotypeDistributionRepeatUnitsSelect.tsx |  36 ++---
 .../ShortTandemRepeatPage.tsx                 |  79 +++++------
 .../ShortTandemRepeatReads.tsx                | 126 ++++++++----------
 .../shortTandemRepeatHelpers.ts               | 102 +++++++++++++-
 7 files changed, 261 insertions(+), 184 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 81c9bcde4..db9900076 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -1,12 +1,11 @@
-import { max, min } from 'd3-array'
-import React, { useState } from 'react'
+import React, { SetStateAction, useState, Dispatch } from 'react'
 
 import { Modal, Select } from '@gnomad/ui'
 
 import ControlSection from '../VariantPage/ControlSection'
 
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
-import { ShortTandemRepeatAdjacentRepeat } from './ShortTandemRepeatPage'
+import { ShortTandemRepeatAdjacentRepeat, ScaleType, Sex } from './ShortTandemRepeatPage'
 import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionPlot from './ShortTandemRepeatGenotypeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionBinDetails from './ShortTandemRepeatGenotypeDistributionBinDetails'
@@ -16,35 +15,40 @@ import {
   getSelectedAlleleSizeDistribution,
   getSelectedGenotypeDistribution,
   getGenotypeDistributionPlotAxisLabels,
+  maxAlleleSizeDistributionRepeats,
+  maxGenotypeDistributionRepeats,
 } from './shortTandemRepeatHelpers'
+import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { Bin as GenotypeBin } from './ShortTandemRepeatGenotypeDistributionPlot'
 
 type Props = {
   adjacentRepeat: ShortTandemRepeatAdjacentRepeat
-  populationIds: string[]
-  selectedPopulationId: string
-  onSelectPopulationId: (...args: any[]) => any
-  selectedScaleType: string
-  onSelectScaleType: (...args: any[]) => any
+  selectedScaleType: ScaleType
+  selectedAncestryGroup: AncestryGroupId | ''
+  selectedSex: Sex | ''
+  ancestryGroups: AncestryGroupId[]
+  selectedGenotypeDistributionBin: GenotypeBin | null
+  setSelectedGenotypeDistributionBin: Dispatch<SetStateAction<GenotypeBin | null>>
+  setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
+  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId | ''>>
+  setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
 }
 
 const ShortTandemRepeatAdjacentRepeatSection = ({
   adjacentRepeat,
-  populationIds,
-  selectedPopulationId,
-  onSelectPopulationId,
+  ancestryGroups,
   selectedScaleType,
-  onSelectScaleType,
+  selectedAncestryGroup,
+  selectedSex,
+  setSelectedScaleType,
+  setSelectedAncestryGroup,
+  setSelectedSex,
 }: Props) => {
   const [selectedRepeatUnit, setSelectedRepeatUnit] = useState(
     adjacentRepeat.repeat_units.length === 1 ? adjacentRepeat.repeat_units[0] : ''
   )
-
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
-    useState(
-      adjacentRepeat.genotype_distribution.repeat_units.length === 1
-        ? adjacentRepeat.genotype_distribution.repeat_units[0].repeat_units.join(' / ')
-        : ''
-    )
+    useState<string>(defaultGenotypeDistributionRepeatUnits)
 
   const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] = useState(null)
 
@@ -55,14 +59,10 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
 
       <h4 style={{ marginBottom: '0.66em' }}>Allele Size Distribution</h4>
       <ShortTandemRepeatAlleleSizeDistributionPlot
-        // @ts-expect-error TS(2322) FIXME: Type '{ maxRepeats: number; alleleSizeDistribution... Remove this comment to see the full error message
-        maxRepeats={
-          adjacentRepeat.allele_size_distribution.distribution[
-            adjacentRepeat.allele_size_distribution.distribution.length - 1
-          ][0]
-        }
+        maxRepeats={maxAlleleSizeDistributionRepeats(adjacentRepeat)}
         alleleSizeDistribution={getSelectedAlleleSizeDistribution(adjacentRepeat, {
-          selectedPopulationId,
+          selectedAncestryGroup,
+          selectedSex,
           selectedRepeatUnit,
         })}
         repeatUnitLength={selectedRepeatUnit ? selectedRepeatUnit.length : null}
@@ -71,9 +71,11 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
       <ControlSection>
         <ShortTandemRepeatPopulationOptions
           id={`${adjacentRepeat.id}-repeat-counts`}
-          populationIds={populationIds}
-          selectedPopulationId={selectedPopulationId}
-          onSelectPopulationId={onSelectPopulationId}
+          ancestryGroups={ancestryGroups}
+          selectedAncestryGroup={selectedAncestryGroup}
+          selectedSex={selectedSex}
+          setSelectedAncestryGroup={setSelectedAncestryGroup}
+          setSelectedSex={setSelectedSex}
         />
 
         <label htmlFor={`short-tandem-repeat-${adjacentRepeat.id}-repeat-unit`}>
@@ -103,7 +105,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
             id={`short-tandem-repeat-${adjacentRepeat.id}-repeat-counts-scale`}
             value={selectedScaleType}
             onChange={(e: any) => {
-              onSelectScaleType(e.target.value)
+              setSelectedScaleType(e.target.value)
             }}
           >
             <option value="linear">Linear</option>
@@ -114,17 +116,12 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
 
       <h4 style={{ marginBottom: '0.66em' }}>Genotype Distribution</h4>
       <ShortTandemRepeatGenotypeDistributionPlot
-        // @ts-expect-error TS(2322) FIXME: Type '{ axisLabels: any; maxRepeats: (string | und... Remove this comment to see the full error message
         axisLabels={getGenotypeDistributionPlotAxisLabels(adjacentRepeat, {
           selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
         })}
-        maxRepeats={[
-          max(adjacentRepeat.genotype_distribution.distribution, (d: any) => max(d.slice(0, 2))),
-          max(adjacentRepeat.genotype_distribution.distribution, (d: any) => min(d.slice(0, 2))),
-        ]}
+        maxRepeats={maxGenotypeDistributionRepeats(adjacentRepeat)}
         genotypeDistribution={getSelectedGenotypeDistribution(adjacentRepeat, {
           selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
-          selectedPopulationId,
         })}
         onSelectBin={(bin: any) => {
           if (bin.xRange[0] !== bin.xRange[1] || bin.yRange[0] !== bin.yRange[1]) {
@@ -136,9 +133,11 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
       <ControlSection>
         <ShortTandemRepeatPopulationOptions
           id={`${adjacentRepeat.id}-genotype-distribution`}
-          populationIds={populationIds}
-          selectedPopulationId={selectedPopulationId}
-          onSelectPopulationId={onSelectPopulationId}
+          ancestryGroups={ancestryGroups}
+          selectedAncestryGroup={selectedAncestryGroup}
+          selectedSex={selectedSex}
+          setSelectedAncestryGroup={setSelectedAncestryGroup}
+          setSelectedSex={setSelectedSex}
         />
 
         <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
@@ -160,7 +159,6 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
         >
           <ShortTandemRepeatGenotypeDistributionBinDetails
             shortTandemRepeatOrAdjacentRepeat={adjacentRepeat}
-            selectedPopulationId={selectedPopulationId}
             selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
             bin={selectedGenotypeDistributionBin}
           />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index a1d0819a4..a05f94760 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -49,7 +49,7 @@ type Props = {
   alleleSizeDistribution: AlleleSizeDistributionItem[]
   repeatUnitLength: number | null
   scaleType: ScaleType
-  ranges: Range[]
+  ranges?: Range[]
   size: { width: number }
 }
 
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index ac497fac3..3619fde9f 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -2,13 +2,16 @@ import React from 'react'
 
 import { List, ListItem } from '@gnomad/ui'
 
-import { ShortTandemRepeat, ShortTandemRepeatAdjacentRepeat } from './ShortTandemRepeatPage'
+import { ShortTandemRepeat, ShortTandemRepeatAdjacentRepeat, Sex } from './ShortTandemRepeatPage'
 import { getSelectedGenotypeDistribution } from './shortTandemRepeatHelpers'
+import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 type Props = {
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
-  selectedPopulationId: string
-  selectedRepeatUnits: string
+  selectedAncestryGroup: AncestryGroupId | ''
+  selectedSex: Sex | ''
+  selectedRepeatUnits: string[] | ''
+  repeatUnitPairs: string[][]
   bin: {
     label: string
     xRange: number[]
@@ -18,13 +21,16 @@ type Props = {
 
 const ShortTandemRepeatGenotypeDistributionBinDetails = ({
   shortTandemRepeatOrAdjacentRepeat,
-  selectedPopulationId,
+  selectedAncestryGroup,
+  selectedSex,
   selectedRepeatUnits,
+  repeatUnitPairs,
   bin,
 }: Props) => {
   const genotypeDistribution = getSelectedGenotypeDistribution(shortTandemRepeatOrAdjacentRepeat, {
-    selectedPopulationId,
+    selectedAncestryGroup,
     selectedRepeatUnits,
+    selectedSex,
   })
 
   const isInBin = (d: any) =>
@@ -47,13 +53,13 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
           <h3>Repeat Units</h3>
           {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
           <List>
-            {shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units
-              .map((repeatUnitsDistribution) => repeatUnitsDistribution.repeat_units)
+            {repeatUnitPairs
               .map((repeatUnits) => ({
                 repeatUnits,
                 distribution: getSelectedGenotypeDistribution(shortTandemRepeatOrAdjacentRepeat, {
-                  selectedPopulationId,
-                  selectedRepeatUnits: repeatUnits.join(' / '),
+                  selectedAncestryGroup,
+                  selectedSex,
+                  selectedRepeatUnits: repeatUnits,
                 }),
               }))
               .flatMap(({ repeatUnits, distribution }: any) => [
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
index 00bf12cbe..05a426835 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
@@ -1,30 +1,36 @@
 import React, { Dispatch, SetStateAction } from 'react'
 
 import { Select } from '@gnomad/ui'
-import { ShortTandemRepeat } from './ShortTandemRepeatPage'
+import { ShortTandemRepeat, ShortTandemRepeatAdjacentRepeat } from './ShortTandemRepeatPage'
+import { genotypeRepunitPairs } from './shortTandemRepeatHelpers'
 
 type Props = {
-  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat
-  repunitPairs: string[]
-  value: string
-  onChange: Dispatch<SetStateAction<string>>
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+  selectedRepeatUnits: string[] | ''
+  setSelectedRepeatUnits: Dispatch<SetStateAction<string[] | ''>>
 }
 
+const isAdjacentRepeat = (
+  obj: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+): obj is ShortTandemRepeatAdjacentRepeat => !obj.hasOwnProperty('associated_diseases')
+
 const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
   shortTandemRepeatOrAdjacentRepeat,
-  value,
-  repunitPairs,
-  onChange,
+  selectedRepeatUnits,
+  setSelectedRepeatUnits,
 }: Props) => {
   // Adjacent repeats do not have classifications for repeat units.
-  const isAdjacentRepeat = !shortTandemRepeatOrAdjacentRepeat.associated_diseases
-  const repeatUnitClassifications: Record<string, string> = isAdjacentRepeat
+  const repeatUnitClassifications: Record<string, string> = isAdjacentRepeat(
+    shortTandemRepeatOrAdjacentRepeat
+  )
     ? {}
     : shortTandemRepeatOrAdjacentRepeat.repeat_units.reduce(
         (acc, repeatUnit) => ({ ...acc, [repeatUnit.repeat_unit]: repeatUnit.classification }),
         {}
       )
 
+  const repunitPairs = genotypeRepunitPairs(shortTandemRepeatOrAdjacentRepeat)
+
   return (
     <label
       htmlFor={`short-tandem-repeat-${shortTandemRepeatOrAdjacentRepeat.id}-genotype-distribution-repeat-units`}
@@ -32,18 +38,18 @@ const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
       Repeat units: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
       <Select
         id={`short-tandem-repeat-${shortTandemRepeatOrAdjacentRepeat.id}-genotype-distribution-repeat-units`}
-        value={value}
-        onChange={(e: { target: { value: string } }) => {
-          onChange(e.target.value)
+        value={selectedRepeatUnits === '' ? '' : selectedRepeatUnits.join(' / ')}
+        onChange={({ target: { value } }: { target: { value: string } }) => {
+          const newPair: string[] | '' = value === '' ? '' : value.split(' / ')
+          setSelectedRepeatUnits(newPair)
         }}
       >
         {repunitPairs.length > 1 && <option value="">All</option>}
         <optgroup label="Repeat unit pairs (only pairs found in gnomAD are listed here)">
           {repunitPairs.map((pair) => {
             return (
-              <option key={pair} value={pair}>
+              <option key={pair.join(' / ')} value={pair.join(' / ')}>
                 {pair
-                  .split(' / ')
                   .map((repeatUnit) => {
                     const notes = []
                     if (repeatUnitClassifications[repeatUnit]) {
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 561c4de89..77727ceaa 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -24,6 +24,9 @@ import {
   getSelectedAlleleSizeDistribution,
   getSelectedGenotypeDistribution,
   getGenotypeDistributionPlotAxisLabels,
+  maxAlleleSizeDistributionRepeats,
+  maxGenotypeDistributionRepeats,
+  genotypeRepunitPairs,
 } from './shortTandemRepeatHelpers'
 import ShortTandemRepeatAdjacentRepeatSection from './ShortTandemRepeatAdjacentRepeatSection'
 import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
@@ -56,7 +59,7 @@ export type GenotypeDistributionItem = {
   frequency: number
 }
 
-type GenotypeDistributionCohort = {
+export type GenotypeDistributionCohort = {
   ancestry_group: string
   sex: Sex
   short_allele_repunit: string
@@ -142,18 +145,12 @@ type ShortTandemRepeatPageProps = {
 export type ScaleType = 'linear' | 'log'
 
 const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
-  const { allele_size_distribution, genotype_distribution } = shortTandemRepeat
+  const { allele_size_distribution } = shortTandemRepeat
 
   const alleleSizeDistributionRepunits = [
     ...new Set(allele_size_distribution.map((cohort) => cohort.repunit)),
   ].sort()
-  const genotypeDistributionRepunitPairs = [
-    ...new Set(
-      genotype_distribution.map((cohort) =>
-        [cohort.short_allele_repunit, cohort.long_allele_repunit].join(' / ')
-      )
-    ),
-  ].sort()
+  const genotypeDistributionRepunitPairs = genotypeRepunitPairs(shortTandemRepeat)
 
   const defaultAlleleSizeRepunit =
     alleleSizeDistributionRepunits.length === 1 ? alleleSizeDistributionRepunits[0] : ''
@@ -166,7 +163,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
-    useState<string | ''>(defaultGenotypeDistributionRepunits)
+    useState<string[] | ''>(defaultGenotypeDistributionRepunits)
   const [selectedDisease, setSelectedDisease] = useState<string>(defaultDisease)
   const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
   const [showAdjacentRepeats, setShowAdjacentRepeats] = useState<boolean>(false)
@@ -175,15 +172,6 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     ...new Set(shortTandemRepeat.allele_size_distribution.map((cohort) => cohort.ancestry_group)),
   ].sort()
 
-  const maxAlleleSizeDistributionRepeats = Math.max(
-    ...shortTandemRepeat.allele_size_distribution.flatMap((cohort) =>
-      cohort.distribution.map((item) => item.repunit_count)
-    )
-  )
-
-  const maxGenotypeDistributionShortAlleleRepeats = 0 // TK
-  const maxGenotypeDistributionLongAlleleRepeats = 0 // TK
-
   const allRepeatUnitsByClassification: Record<string, string[]> = {}
   shortTandemRepeat.repeat_units.forEach((repeatUnit) => {
     if (allRepeatUnitsByClassification[repeatUnit.classification] === undefined) {
@@ -232,6 +220,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] =
     useState<GenotypeBin | null>(null)
 
+  const maxAlleleRepeats = maxAlleleSizeDistributionRepeats(shortTandemRepeat)
   return (
     <>
       <FlexWrapper style={{ marginBottom: '3em' }}>
@@ -280,7 +269,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Allele Size Distribution <InfoButton topic="str-allele-size-distribution" />
         </h2>
         <ShortTandemRepeatAlleleSizeDistributionPlot
-          maxRepeats={maxAlleleSizeDistributionRepeats}
+          maxRepeats={maxAlleleRepeats}
           alleleSizeDistribution={getSelectedAlleleSizeDistribution(shortTandemRepeat, {
             selectedAncestryGroup,
             selectedSex,
@@ -453,19 +442,17 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           axisLabels={getGenotypeDistributionPlotAxisLabels(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
           })}
-          maxRepeats={[
-            maxGenotypeDistributionLongAlleleRepeats,
-            maxGenotypeDistributionShortAlleleRepeats,
-          ]}
+          maxRepeats={maxGenotypeDistributionRepeats(shortTandemRepeat)}
           genotypeDistribution={getSelectedGenotypeDistribution(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
             selectedAncestryGroup,
+            selectedSex,
           })}
           xRanges={
             (selectedGenotypeDistributionRepeatUnits === '' &&
               allRepeatUnitsFoundInGnomadArePathogenic) ||
             ((allRepeatUnitsByClassification as any).pathogenic || []).includes(
-              selectedGenotypeDistributionRepeatUnits.split(' / ')[0]
+              selectedGenotypeDistributionRepeatUnits[0]
             )
               ? plotRanges
               : []
@@ -474,7 +461,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             (selectedGenotypeDistributionRepeatUnits === '' &&
               allRepeatUnitsFoundInGnomadArePathogenic) ||
             ((allRepeatUnitsByClassification as any).pathogenic || []).includes(
-              selectedGenotypeDistributionRepeatUnits.split(' / ')[1]
+              selectedGenotypeDistributionRepeatUnits[1]
             )
               ? plotRanges
               : []
@@ -496,9 +483,8 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           />
           <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
-            repunitPairs={genotypeDistributionRepunitPairs}
-            value={selectedGenotypeDistributionRepeatUnits}
-            onChange={setSelectedGenotypeDistributionRepeatUnits}
+            selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
+            setSelectedRepeatUnits={setSelectedGenotypeDistributionRepeatUnits}
           />
         </ControlSection>
         {shortTandemRepeat.associated_diseases.length > 1 && (
@@ -529,11 +515,9 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
 
         {((selectedGenotypeDistributionRepeatUnits === '' &&
           !allRepeatUnitsFoundInGnomadArePathogenic) ||
-          !selectedGenotypeDistributionRepeatUnits
-            .split(' / ')
-            .every((repeatUnit) =>
-              ((allRepeatUnitsByClassification as any).pathogenic || []).includes(repeatUnit)
-            )) && (
+          !(selectedGenotypeDistributionRepeatUnits as string[]).every((repeatUnit) =>
+            ((allRepeatUnitsByClassification as any).pathogenic || []).includes(repeatUnit)
+          )) && (
           <p style={{ marginBottom: 0 }}>
             <Badge level="info">Note</Badge> This plot includes non-pathogenic repeat units. Use the
             &ldquo;Repeat units&rdquo; menu to view specific repeat units.
@@ -553,9 +537,11 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         >
           <ShortTandemRepeatGenotypeDistributionBinDetails
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
-            selectedPopulationId={selectedAncestryGroup}
-            selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
             bin={selectedGenotypeDistributionBin}
+            selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
+            selectedAncestryGroup={selectedAncestryGroup}
+            selectedSex={selectedSex}
+            repeatUnitPairs={genotypeDistributionRepunitPairs}
           />
         </Modal>
       )}
@@ -566,7 +552,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         </h2>
         <ShortTandemRepeatAgeDistributionPlot
           ageDistribution={shortTandemRepeat.age_distribution}
-          maxRepeats={maxAlleleSizeDistributionRepeats}
+          maxRepeats={maxAlleleRepeats}
           ranges={allRepeatUnitsFoundInGnomadArePathogenic ? plotRanges : []}
         />
         {!allRepeatUnitsFoundInGnomadArePathogenic && (
@@ -587,10 +573,15 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                 <ShortTandemRepeatAdjacentRepeatSection
                   key={adjacentRepeat.id}
                   adjacentRepeat={adjacentRepeat}
-                  selectedPopulationId={selectedAncestryGroup}
-                  onSelectPopulationId={setSelectedAncestryGroup}
+                  ancestryGroups={ancestryGroups}
+                  selectedAncestryGroup={selectedAncestryGroup}
+                  selectedSex={selectedSex}
                   selectedScaleType={selectedScaleType}
-                  onSelectScaleType={setSelectedScaleType}
+                  selectedGenotypeDistributionBin={selectedGenotypeDistributionBin}
+                  setSelectedAncestryGroup={setSelectedAncestryGroup}
+                  setSelectedSex={setSelectedSex}
+                  setSelectedScaleType={setSelectedScaleType}
+                  setSelectedGenotypeDistributionBin={setSelectedGenotypeDistributionBin}
                 />
               )
             })
@@ -612,7 +603,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           Read Data{' '}
           <InfoButton
             topic={
-              shortTandemRepeat.allele_size_distribution.repeat_units.length > 1
+              alleleSizeDistributionRepunits.length > 1
                 ? 'str-read-data-multiple-repeat-units'
                 : 'str-read-data'
             }
@@ -631,9 +622,9 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ShortTandemRepeatReads
           datasetId={datasetId}
           shortTandemRepeat={shortTandemRepeat}
-          filter={{
-            ...parseCombinedPopulationId(selectedAncestryGroup),
-          }}
+          maxRepeats={maxAlleleRepeats}
+          alleleSizeDistributionRepeatUnits={alleleSizeDistributionRepunits}
+          filter={{ population: selectedAncestryGroup, sex: selectedSex }}
         />
       </section>
     </>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
index 4cf2e151d..a874706dd 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
@@ -3,7 +3,10 @@ import styled from 'styled-components'
 
 import { Button, Input, Select } from '@gnomad/ui'
 
-import { GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
+import {
+  GNOMAD_POPULATION_NAMES,
+  AncestryGroupId,
+} from '@gnomad/dataset-metadata/gnomadPopulations'
 
 import AttributeList, { AttributeListItem } from '../AttributeList'
 import Delayed from '../Delayed'
@@ -43,7 +46,7 @@ type ShortTandemRepeatReadProps = {
         lower: number
       }
     }[]
-    population: string
+    population: AncestryGroupId
     sex: string
     age?: string
     pcr_protocol: string
@@ -58,7 +61,6 @@ const ShortTandemRepeatRead = ({ read }: ShortTandemRepeatReadProps) => {
     <div>
       <AttributeList style={{ marginBottom: '1em' }}>
         <AttributeListItem label="Population">
-          {/* @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message */}
           {GNOMAD_POPULATION_NAMES[read.population]}
         </AttributeListItem>
         <AttributeListItem label="Sex">{read.sex}</AttributeListItem>
@@ -117,11 +119,10 @@ const ShortTandemRepeatReadContainer = ({
     )
   }
 
-  if (error) {
+  if (error || !read) {
     return <StatusMessage>Unable to load read</StatusMessage>
   }
 
-  // @ts-expect-error TS(2322) FIXME: Type 'null' is not assignable to type '{ alleles: ... Remove this comment to see the full error message
   return <ShortTandemRepeatRead read={read} />
 }
 
@@ -194,15 +195,7 @@ const fetchReads = ({ datasetId, shortTandemRepeatId, filter, limit, offset }: a
 type ShortTandemRepeatReadsProps = {
   datasetId: string
   shortTandemRepeat: ShortTandemRepeat
-  filter: {
-    population?: string
-    sex?: string
-    alleles?: {
-      repeat_unit?: string
-      min_repeats?: number
-      max_repeat?: number
-    }[]
-  }
+  filter: Filters
 }
 
 const ShortTandemRepeatReads = ({
@@ -210,12 +203,12 @@ const ShortTandemRepeatReads = ({
   shortTandemRepeat,
   filter,
 }: ShortTandemRepeatReadsProps) => {
-  const fetchReadsTimer = useRef(null)
+  const fetchReadsTimer = useRef<ReturnType<typeof setTimeout> | null>(null)
   const fetchNumReadsMemoized = useCallback(() => {
-    // @ts-expect-error TS(2769) FIXME: No overload matches this call.
-    clearTimeout(fetchReadsTimer.current)
+    if (fetchReadsTimer.current) {
+      clearTimeout(fetchReadsTimer.current)
+    }
     return new Promise((resolve: any, reject: any) => {
-      // @ts-expect-error TS(2322) FIXME: Type 'Timeout' is not assignable to type 'null'.
       fetchReadsTimer.current = setTimeout(() => {
         fetchNumReads({ datasetId, shortTandemRepeatId: shortTandemRepeat.id, filter }).then(
           resolve,
@@ -224,8 +217,8 @@ const ShortTandemRepeatReads = ({
       }, 300)
     })
   }, [datasetId, shortTandemRepeat, filter])
-  const { isLoading, response: numReads, error } = useRequest(fetchNumReadsMemoized)
-
+  const { isLoading, response, error } = useRequest(fetchNumReadsMemoized)
+  const numReads: number = (response as unknown as { numReads: number }).numReads
   const readsStore = useRef(new Map())
   const [readIndex, setReadIndex] = useState(0)
 
@@ -307,18 +300,15 @@ const ShortTandemRepeatReads = ({
             min={1}
             max={numReads}
             onChange={(e: any) => {
-              // @ts-expect-error TS(2531) FIXME: Object is possibly 'null'.
-              setReadIndex(Math.max(0, Math.min(numReads - 1, Number(e.target.value) - 1)))
+              setReadIndex(Math.max(0, Math.min(numReads! - 1, Number(e.target.value) - 1)))
             }}
             style={{ width: '10ch' }}
           />{' '}
-          {/* @ts-expect-error TS(2531) FIXME: Object is possibly 'null'. */}
-          of {numReads.toLocaleString()}
+          of {numReads!.toLocaleString()}
         </span>
 
         <Button
           onClick={() => {
-            // @ts-expect-error TS(2531) FIXME: Object is possibly 'null'.
             if (readIndex < numReads - 1) {
               setReadIndex((previousReadIndex) => previousReadIndex + 1)
             }
@@ -351,23 +341,21 @@ const ShortTandemRepeatReadsAllelesFilterControlWrapper = styled.div`
 type ShortTandemRepeatReadsAllelesFilterControlsProps = {
   shortTandemRepeat: ShortTandemRepeat
   value: {
-    repeat_unit?: string
-    min_repeats?: number
-    max_repeats?: number
+    repeat_unit: string | null
+    min_repeats: number | null
+    max_repeats: number | null
   }[]
+  maxRepeats: number
   onChange: (...args: any[]) => any
+  alleleSizeDistributionRepeatUnits: string[]
 }
 
 const ShortTandemRepeatReadsAllelesFilterControls = ({
-  shortTandemRepeat,
   value,
+  maxRepeats,
   onChange,
+  alleleSizeDistributionRepeatUnits,
 }: ShortTandemRepeatReadsAllelesFilterControlsProps) => {
-  const maxNumRepeats =
-    shortTandemRepeat.allele_size_distribution.distribution[
-      shortTandemRepeat.allele_size_distribution.distribution.length - 1
-    ][0]
-
   return (
     <ShortTandemRepeatReadsAllelesFilterControlsWrapper>
       {[0, 1].map((alleleIndex) => (
@@ -387,12 +375,10 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
                 )
               }}
             >
-              {shortTandemRepeat.allele_size_distribution.repeat_units.length > 1 && (
-                <option value="">Any</option>
-              )}
-              {shortTandemRepeat.allele_size_distribution.repeat_units.map((repeatUnit) => (
-                <option key={repeatUnit.repeat_unit} value={repeatUnit.repeat_unit}>
-                  {repeatUnit.repeat_unit}
+              {alleleSizeDistributionRepeatUnits.length > 1 && <option value="">Any</option>}
+              {alleleSizeDistributionRepeatUnits.map((repeatUnit) => (
+                <option key={repeatUnit} value={repeatUnit}>
+                  {repeatUnit}
                 </option>
               ))}
             </Select>
@@ -403,10 +389,10 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
               type="number"
               id={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-min-repeats`}
               min={0}
-              max={maxNumRepeats}
+              max={maxRepeats}
               value={value[alleleIndex].min_repeats}
               onChange={(e: any) => {
-                const newMinRepeats = Math.max(Math.min(Number(e.target.value), maxNumRepeats), 0)
+                const newMinRepeats = Math.max(Math.min(Number(e.target.value), maxRepeats), 0)
                 onChange(
                   value.map((v, i) =>
                     i === alleleIndex ? { ...v, min_repeats: newMinRepeats } : v
@@ -421,10 +407,10 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
               type="number"
               id={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-max-repeats`}
               min={0}
-              max={maxNumRepeats}
+              max={maxRepeats}
               value={value[alleleIndex].max_repeats}
               onChange={(e: any) => {
-                const newMaxRepeats = Math.max(Math.min(Number(e.target.value), maxNumRepeats), 0)
+                const newMaxRepeats = Math.max(Math.min(Number(e.target.value), maxRepeats), 0)
                 onChange(
                   value.map((v, i) =>
                     i === alleleIndex ? { ...v, max_repeats: newMaxRepeats } : v
@@ -440,54 +426,56 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
   )
 }
 
+type Filters = {
+  population: string | null
+  sex: string | null
+  alleles:
+    | {
+        repeat_unit: string | null
+        min_repeats: number | null
+        max_repeats: number | null
+      }[]
+    | null
+}
+
 type ShortTandemRepeatReadsContainerProps = {
   datasetId: string
   shortTandemRepeat: ShortTandemRepeat
-  filter: {
-    population?: string
-    sex?: string
-    alleles?: {
-      repeat_unit?: string
-      min_repeats?: number
-      max_repeats?: number
-    }[]
-  }
+  filter: Omit<Filters, 'alleles'>
+  maxRepeats: number
+  alleleSizeDistributionRepeatUnits: string[]
 }
 
 const ShortTandemRepeatReadsContainer = ({
   datasetId,
   shortTandemRepeat,
+  maxRepeats,
+  alleleSizeDistributionRepeatUnits,
   filter: baseFilter,
 }: ShortTandemRepeatReadsContainerProps) => {
-  const maxNumRepeats =
-    shortTandemRepeat.allele_size_distribution.distribution[
-      shortTandemRepeat.allele_size_distribution.distribution.length - 1
-    ][0]
-
-  const [filter, setFilter] = useState({
+  const [filter, setFilter] = useState<Filters>({
     ...baseFilter,
     alleles: [
       {
         repeat_unit:
-          shortTandemRepeat.allele_size_distribution.repeat_units.length > 1
+          alleleSizeDistributionRepeatUnits.length > 1
             ? null
-            : shortTandemRepeat.allele_size_distribution.repeat_units[0].repeat_unit,
+            : alleleSizeDistributionRepeatUnits[0],
         min_repeats: 0,
-        max_repeats: maxNumRepeats,
+        max_repeats: maxRepeats,
       },
       {
         repeat_unit:
-          shortTandemRepeat.allele_size_distribution.repeat_units.length > 1
+          alleleSizeDistributionRepeatUnits.length > 1
             ? null
-            : shortTandemRepeat.allele_size_distribution.repeat_units[0].repeat_unit,
+            : alleleSizeDistributionRepeatUnits[0],
         min_repeats: 0,
-        max_repeats: maxNumRepeats,
+        max_repeats: maxRepeats,
       },
     ],
   })
 
   if (baseFilter.population !== filter.population || baseFilter.sex !== filter.sex) {
-    // @ts-expect-error TS(2345) FIXME: Argument of type '{ population?: string | undefine... Remove this comment to see the full error message
     setFilter({
       ...filter,
       ...baseFilter,
@@ -498,16 +486,16 @@ const ShortTandemRepeatReadsContainer = ({
     <>
       <ShortTandemRepeatReadsAllelesFilterControls
         shortTandemRepeat={shortTandemRepeat}
-        // @ts-expect-error TS(2322) FIXME: Type '{ repeat_unit: string | null; min_repeats: n... Remove this comment to see the full error message
-        value={filter.alleles}
+        value={filter.alleles || []}
         onChange={(newAllelesFilter) => {
           setFilter((prevFilter) => ({ ...prevFilter, alleles: newAllelesFilter }))
         }}
+        maxRepeats={maxRepeats}
+        alleleSizeDistributionRepeatUnits={alleleSizeDistributionRepeatUnits}
       />
       <ShortTandemRepeatReads
         datasetId={datasetId}
         shortTandemRepeat={shortTandemRepeat}
-        // @ts-expect-error TS(2322) FIXME: Type '{ alleles: { repeat_unit: string | null; min... Remove this comment to see the full error message
         filter={filter}
       />
     </>
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index b13d0b50f..6e7b99abf 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -3,6 +3,9 @@ import {
   ShortTandemRepeat,
   AlleleSizeDistributionItem,
   AlleleSizeDistributionCohort,
+  GenotypeDistributionCohort,
+  GenotypeDistributionItem,
+  ShortTandemRepeatAdjacentRepeat,
 } from './ShortTandemRepeatPage'
 import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
@@ -12,7 +15,7 @@ type AlleleSizeDistributionFilters = {
   selectedRepeatUnit: string
 }
 
-const addCohortToDistribution = (
+const addCohortToAlleleSizeDistribution = (
   cohort: AlleleSizeDistributionCohort,
   distribution: Record<number, AlleleSizeDistributionItem>
 ): Record<number, AlleleSizeDistributionItem> =>
@@ -28,7 +31,7 @@ const addCohortToDistribution = (
   }, distribution)
 
 export const getSelectedAlleleSizeDistribution = (
-  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat,
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
   { selectedAncestryGroup, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
 ): AlleleSizeDistributionItem[] => {
   // TK figure out what's up with classification
@@ -43,7 +46,7 @@ export const getSelectedAlleleSizeDistribution = (
       if (cohort.repunit !== selectedRepeatUnit) {
         return acc
       }
-      return addCohortToDistribution(cohort, acc)
+      return addCohortToAlleleSizeDistribution(cohort, acc)
     }, {} as Record<number, AlleleSizeDistributionItem>)
   return Object.values(itemsByRepunitCount)
 }
@@ -93,10 +96,56 @@ export const getSelectedAlleleSizeDistribution = (
   return shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.distribution
 }*/
 
+// Returns `distribution` plus this cohort's items, summing frequency per "short / long" count key.
+const addCohortToGenotypeDistribution = (
+  cohort: GenotypeDistributionCohort,
+  distribution: Record<string, GenotypeDistributionItem>
+): Record<string, GenotypeDistributionItem> =>
+  cohort.distribution.reduce((acc, distributionItem) => {
+    const { short_allele_repunit_count, long_allele_repunit_count } = distributionItem
+    const key = [short_allele_repunit_count, long_allele_repunit_count].join(' / ')
+    const countSoFar = acc[key] ? acc[key].frequency : 0
+    const newItem: GenotypeDistributionItem = {
+      short_allele_repunit_count,
+      long_allele_repunit_count,
+      frequency: countSoFar + distributionItem.frequency,
+    }
+    return { ...acc, [key]: newItem }
+  }, distribution)
+
 export const getSelectedGenotypeDistribution = (
-  shortTandemRepeatOrAdjacentRepeat: any,
-  { selectedRepeatUnits, selectedPopulationId }: any
-) => {
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
+  {
+    selectedRepeatUnits,
+    selectedAncestryGroup,
+    selectedSex,
+  }: {
+    selectedRepeatUnits: string[] | ''
+    selectedAncestryGroup: AncestryGroupId | ''
+    selectedSex: Sex | ''
+  }
+): GenotypeDistributionItem[] => {
+  const itemsByRepunitCounts: Record<string, GenotypeDistributionItem> =
+    shortTandemRepeatOrAdjacentRepeat.genotype_distribution.reduce((acc, cohort) => {
+      if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {
+        return acc
+      }
+      if (selectedSex !== '' && cohort.sex !== selectedSex) {
+        return acc
+      }
+      if (
+        selectedRepeatUnits !== '' &&
+        (cohort.short_allele_repunit !== selectedRepeatUnits[0] ||
+          cohort.long_allele_repunit !== selectedRepeatUnits[1])
+      ) {
+        return acc
+      }
+      return addCohortToGenotypeDistribution(cohort, acc)
+    }, {})
+  return Object.values(itemsByRepunitCounts)
+}
+
+/* {
   const baseDistribution = selectedRepeatUnits
     ? shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units.find(
         (repeatUnit: any) => repeatUnit.repeat_units.join(' / ') === selectedRepeatUnits
@@ -113,7 +162,7 @@ export const getSelectedGenotypeDistribution = (
     selectedRepeatUnits.split(' / ')[0] === selectedRepeatUnits.split(' / ')[1]
     ? selectedDistribution.map((d: any) => (d[0] >= d[1] ? d : [d[1], d[0], d[2]]))
     : selectedDistribution
-}
+}*/
 
 export const getGenotypeDistributionPlotAxisLabels = (
   shortTandemRepeatOrAdjacentRepeat: any,
@@ -130,3 +179,42 @@ export const getGenotypeDistributionPlotAxisLabels = (
   }
   return ['longer allele', 'shorter allele']
 }
+
+// Largest repunit count found in any cohort's allele size distribution.
+// Returns 0 when there are no items; a bare Math.max() would return -Infinity.
+export const maxAlleleSizeDistributionRepeats = (
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+): number =>
+  shortTandemRepeatOrAdjacentRepeat.allele_size_distribution
+    .flatMap((cohort) => cohort.distribution.map((item) => item.repunit_count))
+    .reduce((max, count) => Math.max(max, count), 0)
+
+// Returns [max long-allele repunit count, max short-allele repunit count] over all cohorts.
+// Each entry falls back to 0 when there are no items; a bare Math.max() would return -Infinity.
+export const maxGenotypeDistributionRepeats = (
+  shortTandemRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+): [number, number] => {
+  const items = shortTandemRepeat.genotype_distribution.flatMap((cohort) => cohort.distribution)
+  const longest = (counts: number[]) => counts.reduce((max, count) => Math.max(max, count), 0)
+  return [
+    longest(items.map((item) => item.long_allele_repunit_count)),
+    longest(items.map((item) => item.short_allele_repunit_count)),
+  ]
+}
+
+export const genotypeRepunitPairs = (
+  shortTandemRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+): string[][] => {
+  // Arrays are compared by identity, not by contents, so the Set trick used to dedupe allele-size distribution repunits (plain strings) would not collapse equal pairs. Key each pair by its joined string instead, then sort by short-allele unit and then long-allele unit.
+  const pairsByKey: Record<string, string[]> = shortTandemRepeat.genotype_distribution.reduce(
+    (acc, { short_allele_repunit, long_allele_repunit }) => {
+      const pair = [short_allele_repunit, long_allele_repunit]
+      const key = pair.join(' / ')
+      return { ...acc, [key]: pair }
+    },
+    {} as Record<string, string[]>
+  )
+  return Object.values(pairsByKey).sort(
+    (a, b) => a[0].localeCompare(b[0]) || a[1].localeCompare(b[1])
+  )
+}

From 24eb72aec7d918d793073475438573c5e289a31f Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Thu, 25 Jul 2024 14:02:51 -0400
Subject: [PATCH 09/36] WIP typechecks

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx | 18 +++++-
 .../ShortTandemRepeatAttributes.tsx           | 12 ++--
 ...emRepeatGenotypeDistributionBinDetails.tsx | 61 ++++++++++++-------
 .../ShortTandemRepeatPage.tsx                 | 30 ++++++---
 .../src/__factories__/ShortTandemRepeat.ts    | 51 +++++++++++++---
 5 files changed, 124 insertions(+), 48 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index db9900076..d31d89cef 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -15,6 +15,7 @@ import {
   getSelectedAlleleSizeDistribution,
   getSelectedGenotypeDistribution,
   getGenotypeDistributionPlotAxisLabels,
+  genotypeRepunitPairs,
   maxAlleleSizeDistributionRepeats,
   maxGenotypeDistributionRepeats,
 } from './shortTandemRepeatHelpers'
@@ -47,8 +48,12 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
   const [selectedRepeatUnit, setSelectedRepeatUnit] = useState(
     adjacentRepeat.repeat_units.length === 1 ? adjacentRepeat.repeat_units[0] : ''
   )
+
+  const genotypeDistributionPairs = genotypeRepunitPairs(adjacentRepeat)
+  const defaultGenotypeDistributionRepeatUnits =
+    genotypeDistributionPairs.length === 1 ? genotypeDistributionPairs[0] : ''
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
-    useState<string>(defaultGenotypeDistributionRepeatUnits)
+    useState<string[] | ''>(defaultGenotypeDistributionRepeatUnits)
 
   const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] = useState(null)
 
@@ -122,12 +127,16 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
         maxRepeats={maxGenotypeDistributionRepeats(adjacentRepeat)}
         genotypeDistribution={getSelectedGenotypeDistribution(adjacentRepeat, {
           selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
+          selectedAncestryGroup: selectedAncestryGroup,
+          selectedSex: selectedSex,
         })}
         onSelectBin={(bin: any) => {
           if (bin.xRange[0] !== bin.xRange[1] || bin.yRange[0] !== bin.yRange[1]) {
             setSelectedGenotypeDistributionBin(bin)
           }
         }}
+        xRanges={[]}
+        yRanges={[]}
       />
 
       <ControlSection>
@@ -142,8 +151,8 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
 
         <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
           shortTandemRepeatOrAdjacentRepeat={adjacentRepeat}
-          value={selectedGenotypeDistributionRepeatUnits}
-          onChange={setSelectedGenotypeDistributionRepeatUnits}
+          selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
+          setSelectedRepeatUnits={setSelectedGenotypeDistributionRepeatUnits}
         />
       </ControlSection>
 
@@ -161,6 +170,9 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
             shortTandemRepeatOrAdjacentRepeat={adjacentRepeat}
             selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
             bin={selectedGenotypeDistributionBin}
+            selectedAncestryGroup={selectedAncestryGroup}
+            selectedSex={selectedSex}
+            repeatUnitPairs={genotypeDistributionPairs}
           />
         </Modal>
       )}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
index ec8457f4f..7c2ecb89c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
@@ -11,14 +11,11 @@ type ShortTandemRepeatRepeatUnitsProps = {
 }
 
 const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRepeatUnitsProps) => {
-  const repeatUnitsByClassification = {}
+  const repeatUnitsByClassification: Record<string, string[]> = {}
   shortTandemRepeat.repeat_units.forEach((repeatUnit) => {
-    // @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message
     if (repeatUnitsByClassification[repeatUnit.classification] === undefined) {
-      // @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message
       repeatUnitsByClassification[repeatUnit.classification] = []
     }
-    // @ts-expect-error TS(7053) FIXME: Element implicitly has an 'any' type because expre... Remove this comment to see the full error message
     repeatUnitsByClassification[repeatUnit.classification].push(repeatUnit.repeat_unit)
   })
 
@@ -132,10 +129,11 @@ const ShortTandemRepeatAttributes = ({ shortTandemRepeat }: ShortTandemRepeatAtt
       <AttributeListItem label="Gene region">{shortTandemRepeat.gene.region}</AttributeListItem>
       <AttributeListItem label="Reference region">
         <Link
-          to={`/region/${shortTandemRepeat.reference_region.chrom}-${shortTandemRepeat.reference_region.start}-${shortTandemRepeat.reference_region.stop}`}
+          to={`/region/${shortTandemRepeat.main_reference_region.chrom}-${shortTandemRepeat.main_reference_region.start}-${shortTandemRepeat.main_reference_region.stop}`}
         >
-          {shortTandemRepeat.reference_region.chrom}-{shortTandemRepeat.reference_region.start}-
-          {shortTandemRepeat.reference_region.stop}
+          {shortTandemRepeat.main_reference_region.chrom}-
+          {shortTandemRepeat.main_reference_region.start}-
+          {shortTandemRepeat.main_reference_region.stop}
         </Link>
       </AttributeListItem>
       <ShortTandemRepeatRepeatUnits shortTandemRepeat={shortTandemRepeat} />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index 3619fde9f..00ad37ee7 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -2,7 +2,12 @@ import React from 'react'
 
 import { List, ListItem } from '@gnomad/ui'
 
-import { ShortTandemRepeat, ShortTandemRepeatAdjacentRepeat, Sex } from './ShortTandemRepeatPage'
+import {
+  ShortTandemRepeat,
+  ShortTandemRepeatAdjacentRepeat,
+  Sex,
+  GenotypeDistributionItem,
+} from './ShortTandemRepeatPage'
 import { getSelectedGenotypeDistribution } from './shortTandemRepeatHelpers'
 import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
@@ -33,20 +38,25 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
     selectedSex,
   })
 
-  const isInBin = (d: any) =>
-    bin.xRange[0] <= d[0] && d[0] <= bin.xRange[1] && bin.yRange[0] <= d[1] && d[1] <= bin.yRange[1]
+  const isInBin = (item: GenotypeDistributionItem) =>
+    bin.xRange[0] <= item.long_allele_repunit_count &&
+    item.long_allele_repunit_count <= bin.xRange[1] &&
+    bin.yRange[0] <= item.short_allele_repunit_count &&
+    item.short_allele_repunit_count <= bin.yRange[1]
 
   return (
     <>
       {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
       <List>
-        {/* @ts-expect-error TS(7031) FIXME: Binding element 'x' implicitly has an 'any' type. */}
-        {genotypeDistribution.filter(isInBin).map(([x, y, n]) => (
-          // @ts-expect-error TS(2769) FIXME: No overload matches this call.
-          <ListItem key={`${x}/${y}`}>
-            {x} repeats / {y} repeats: {n} individuals
-          </ListItem>
-        ))}
+        {genotypeDistribution
+          .filter(isInBin)
+          .map(({ long_allele_repunit_count, short_allele_repunit_count, frequency }) => (
+            // @ts-expect-error TS(2769) FIXME: No overload matches this call.
+            <ListItem key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}>
+              {long_allele_repunit_count} repeats / {short_allele_repunit_count} repeats:{' '}
+              {frequency} individuals
+            </ListItem>
+          ))}
       </List>
       {!selectedRepeatUnits && (
         <>
@@ -62,7 +72,7 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
                   selectedRepeatUnits: repeatUnits,
                 }),
               }))
-              .flatMap(({ repeatUnits, distribution }: any) => [
+              .flatMap(({ repeatUnits, distribution }) => [
                 {
                   repeatUnits,
                   distribution: distribution.filter((d: any) => d[0] >= d[1]).filter(isInBin),
@@ -70,25 +80,32 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
                 {
                   repeatUnits: [...repeatUnits].reverse(),
                   distribution: distribution
-                    .filter((d: any) => d[0] < d[1])
-                    .map((d: any) => [d[1], d[0], d[2]])
+                    .filter((d) => d.long_allele_repunit_count < d.short_allele_repunit_count)
+                    .map((d) => ({
+                      ...d,
+                      long_allele_repunit_count: d.short_allele_repunit_count,
+                      short_allele_repunit_count: d.long_allele_repunit_count,
+                    }))
                     .filter(isInBin),
                 },
               ])
-              .filter(({ distribution }: any) => distribution.length > 0)
-              .map(({ repeatUnits, distribution }: any) => (
+              .map(({ repeatUnits, distribution }) => (
                 // @ts-expect-error TS(2769) FIXME: No overload matches this call.
                 <ListItem key={repeatUnits.join('/')}>
                   {repeatUnits.join(' / ')}
                   {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
                   <List>
-                    {/* @ts-expect-error TS(7031) FIXME: Binding element 'x' implicitly has an 'any' type. */}
-                    {distribution.map(([x, y, n]) => (
-                      // @ts-expect-error TS(2769) FIXME: No overload matches this call.
-                      <ListItem key={`${x}/${y}`}>
-                        {x} repeats / {y} repeats: {n} individuals
-                      </ListItem>
-                    ))}
+                    {distribution.map(
+                      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => (
+                        // @ts-expect-error TS(2769) FIXME: No overload matches this call.
+                        <ListItem
+                          key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}
+                        >
+                          {long_allele_repunit_count} repeats / {short_allele_repunit_count}{' '}
+                          repeats: {frequency} individuals
+                        </ListItem>
+                      )
+                    )}
                   </List>
                 </ListItem>
               ))}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 77727ceaa..715b6b465 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -221,6 +221,18 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     useState<GenotypeBin | null>(null)
 
   const maxAlleleRepeats = maxAlleleSizeDistributionRepeats(shortTandemRepeat)
+
+  // True when nothing is selected and every repeat unit found in gnomAD is pathogenic, or when the
+  // selected repeat unit at `selectionIndex` is classified as pathogenic. Reads only its arguments.
+  const isRepunitSelectionPathogenic = (
+    selectedRepeatUnits: string[] | '',
+    allRepeatUnitsFoundInGnomadArePathogenic: boolean,
+    allRepeatUnitsByClassification: Record<string, string[]>,
+    selectionIndex: number
+  ) =>
+    (selectedRepeatUnits === '' && allRepeatUnitsFoundInGnomadArePathogenic) ||
+    (allRepeatUnitsByClassification.pathogenic || []).includes(selectedRepeatUnits[selectionIndex])
+
   return (
     <>
       <FlexWrapper style={{ marginBottom: '3em' }}>
@@ -449,19 +461,21 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             selectedSex,
           })}
           xRanges={
-            (selectedGenotypeDistributionRepeatUnits === '' &&
-              allRepeatUnitsFoundInGnomadArePathogenic) ||
-            ((allRepeatUnitsByClassification as any).pathogenic || []).includes(
-              selectedGenotypeDistributionRepeatUnits[0]
+            isRepunitSelectionPathogenic(
+              selectedGenotypeDistributionRepeatUnits,
+              allRepeatUnitsFoundInGnomadArePathogenic,
+              allRepeatUnitsByClassification,
+              0
             )
               ? plotRanges
               : []
           }
           yRanges={
-            (selectedGenotypeDistributionRepeatUnits === '' &&
-              allRepeatUnitsFoundInGnomadArePathogenic) ||
-            ((allRepeatUnitsByClassification as any).pathogenic || []).includes(
-              selectedGenotypeDistributionRepeatUnits[1]
+            isRepunitSelectionPathogenic(
+              selectedGenotypeDistributionRepeatUnits,
+              allRepeatUnitsFoundInGnomadArePathogenic,
+              allRepeatUnitsByClassification,
+              1
             )
               ? plotRanges
               : []
diff --git a/browser/src/__factories__/ShortTandemRepeat.ts b/browser/src/__factories__/ShortTandemRepeat.ts
index c2d8ff741..81f0d59a9 100644
--- a/browser/src/__factories__/ShortTandemRepeat.ts
+++ b/browser/src/__factories__/ShortTandemRepeat.ts
@@ -27,24 +27,59 @@ const shortTandemRepeatFactory = Factory.define<ShortTandemRepeat>(({ params, as
         notes: 'hello world',
       },
     ],
-    reference_region = { chrom: '1', start: 10000000, stop: 15000000 },
-    allele_size_distribution = {
-      distribution: [[1, 1]],
-      populations: [],
-      repeat_units: [],
-    },
-    genotype_distribution = { distribution: [], populations: [], repeat_units: [] },
+    main_reference_region = { chrom: '1', start: 10000000, stop: 15000000 },
+    reference_regions = [{ chrom: '1', start: 10000000, stop: 15000000 }],
+    allele_size_distribution = [
+      {
+        ancestry_group: 'asj',
+        sex: 'XY',
+        repunit: 'ACCA',
+        quality_description: 'medium-low',
+        q_score: 0.6,
+        distribution: [
+          { repunit_count: 3, frequency: 12 },
+          { repunit_count: 4, frequency: 123 },
+        ],
+      },
+    ],
+    genotype_distribution = [
+      {
+        ancestry_group: 'asj',
+        sex: 'XY',
+        short_allele_repunit: 'ACCA',
+        long_allele_repunit: 'GATA',
+        quality_description: 'high',
+        q_score: 1.0,
+        distribution: [
+          { short_allele_repunit_count: 8, long_allele_repunit_count: 9, frequency: 15 },
+          { short_allele_repunit_count: 8, long_allele_repunit_count: 10, frequency: 19 },
+          { short_allele_repunit_count: 9, long_allele_repunit_count: 10, frequency: 17 },
+        ],
+      },
+    ],
+    age_distribution = [
+      {
+        age_range: [null, 18],
+        distribution: [
+          [8, 6],
+          [9, 3],
+          [10, 9],
+        ],
+      },
+    ],
   } = associations
 
   return {
     id,
     gene,
     associated_diseases,
-    reference_region,
+    main_reference_region,
+    reference_regions,
     reference_repeat_unit,
     repeat_units,
     allele_size_distribution,
     genotype_distribution,
+    age_distribution,
     stripy_id,
     adjacent_repeats,
   }

From 678272d6a31525515e29e257879701dc092dc3d9 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 26 Jul 2024 11:19:22 -0400
Subject: [PATCH 10/36] WIP flush any's, flush bugs

---
 .../ShortTandemRepeatAdjacentRepeatSection.tsx   | 11 ++++++-----
 .../ShortTandemRepeatAgeDistributionPlot.tsx     | 12 ++++++------
 ...ortTandemRepeatAlleleSizeDistributionPlot.tsx | 16 ++++++++--------
 .../ShortTandemRepeatAttributes.tsx              |  8 ++++----
 ...andemRepeatGenotypeDistributionBinDetails.tsx |  4 +++-
 .../ShortTandemRepeatPage.tsx                    | 14 +++++++-------
 .../shortTandemRepeatHelpers.ts                  | 15 +++++++--------
 7 files changed, 41 insertions(+), 39 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index d31d89cef..921dadb9d 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -55,7 +55,8 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
     useState<string[] | ''>(defaultGenotypeDistributionRepeatUnits)
 
-  const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] = useState(null)
+  const [selectedGenotypeDistributionBin, setSelectedGenotypeDistributionBin] =
+    useState<GenotypeBin | null>(null)
 
   return (
     <section style={{ marginBottom: '3em' }}>
@@ -88,7 +89,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
           <Select
             id={`short-tandem-repeat-${adjacentRepeat.id}-repeat-unit`}
             value={selectedRepeatUnit}
-            onChange={(e: any) => {
+            onChange={(e: { target: { value: string } }) => {
               setSelectedRepeatUnit(e.target.value)
             }}
           >
@@ -109,7 +110,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
           <Select
             id={`short-tandem-repeat-${adjacentRepeat.id}-repeat-counts-scale`}
             value={selectedScaleType}
-            onChange={(e: any) => {
+            onChange={(e: { target: { value: ScaleType } }) => {
               setSelectedScaleType(e.target.value)
             }}
           >
@@ -130,7 +131,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
           selectedAncestryGroup: selectedAncestryGroup,
           selectedSex: selectedSex,
         })}
-        onSelectBin={(bin: any) => {
+        onSelectBin={(bin: GenotypeBin) => {
           if (bin.xRange[0] !== bin.xRange[1] || bin.yRange[0] !== bin.yRange[1]) {
             setSelectedGenotypeDistributionBin(bin)
           }
@@ -158,7 +159,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
 
       {selectedGenotypeDistributionBin && (
         <Modal
-          title={(selectedGenotypeDistributionBin as any).label}
+          title={selectedGenotypeDistributionBin.label}
           size="large"
           // @ts-expect-error TS(2322) FIXME: Type '{ children: Element; title: any; size: "larg... Remove this comment to see the full error message
           initialFocusOnButton={false}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
index f93abbac4..c328be5e8 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAgeDistributionPlot.tsx
@@ -59,7 +59,7 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
 
     const yNumBins = ageDistribution.length
 
-    const data = Array.from(Array(xNumBins * yNumBins).keys()).map((n: any) => {
+    const data = Array.from(Array(xNumBins * yNumBins).keys()).map((n) => {
       const xBinIndex = Math.floor(n / yNumBins)
       const yBinIndex = n % yNumBins
 
@@ -102,7 +102,7 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
     const xMaxNumLabels = Math.floor(plotWidth / 20)
     const xLabelInterval = Math.max(Math.round(xNumBins / xMaxNumLabels), 1)
 
-    const xTickFormat = (binIndex: any) => {
+    const xTickFormat = (binIndex: number) => {
       if (binIndex % xLabelInterval !== 0) {
         return ''
       }
@@ -114,12 +114,12 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
       return `${binIndex * xBinSize} - ${binIndex * xBinSize + xBinSize - 1}`
     }
 
-    const yTickFormat = (binIndex: any) => {
+    const yTickFormat = (binIndex: number) => {
       return ageRangeLabel(ageDistribution[binIndex].age_range)
     }
 
     const opacityScale = scaleLog()
-      .domain([1, max(ageDistribution, (ageBin) => max(ageBin.distribution, (d: any) => d[1]))])
+      .domain([1, max(ageDistribution, (ageBin) => max(ageBin.distribution, (d) => d[1])) || 2])
       .range([0.1, 1])
 
     return (
@@ -178,8 +178,8 @@ const ShortTandemRepeatAgeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left},${margin.top})`}>
             {data
-              .filter((d: any) => d.count !== 0)
-              .map((d: any) => {
+              .filter((d) => d.count !== 0)
+              .map((d) => {
                 return (
                   <React.Fragment key={`${d.xBinIndex}-${d.yBinIndex}`}>
                     <TooltipAnchor
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index a05f94760..755f946b7 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -78,7 +78,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
     const nBins = Math.floor(maxRepeats / binSize) + 1
 
     const data = useMemo(() => {
-      const d = Array.from(Array(nBins).keys()).map((n: any) => ({
+      const d = Array.from(Array(nBins).keys()).map((n) => ({
         binIndex: n,
         label: binSize === 1 ? `${n}` : `${n * binSize} - ${n * binSize + binSize - 1}`,
         count: 0,
@@ -93,20 +93,20 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
     }, [alleleSizeDistribution, nBins, binSize])
 
     const xScale = scaleBand<number>()
-      .domain(data.map((d: any) => d.binIndex))
+      .domain(data.map((d) => d.binIndex))
       .range([0, plotWidth])
 
     const xBandwidth = xScale.bandwidth()
 
     let yScale: any
     if (scaleType === 'log') {
-      const maxLog = Math.ceil(Math.log10(max(data, (d: any) => d.count) || 1))
+      const maxLog = Math.ceil(Math.log10(max(data, (d) => d.count) || 1))
       yScale = scaleLog()
         .domain([1, 10 ** maxLog])
         .range([plotHeight - 10, 0])
     } else {
       yScale = scaleLinear()
-        .domain([0, max(data, (d: any) => d.count) || 1])
+        .domain([0, max(data, (d) => d.count) || 1])
         .range([plotHeight, 0])
     }
 
@@ -199,7 +199,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
             />
           )}
           <g transform={`translate(${margin.left},${margin.top})`}>
-            {data.map((d: any) => {
+            {data.map((d) => {
               const y = d.count === 0 ? plotHeight : yScale(d.count)
               return (
                 <React.Fragment key={`${d.binIndex}`}>
@@ -233,9 +233,9 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
 
           <g transform={`translate(${margin.left}, 0)`}>
             {ranges
-              .filter((range: any) => range.start !== range.stop)
-              .filter((range: any) => range.start <= maxRepeats)
-              .map((range: any, rangeIndex: any) => {
+              .filter((range) => range.start !== range.stop)
+              .filter((range) => range.start <= maxRepeats)
+              .map((range, rangeIndex) => {
                 const startBinIndex = Math.floor(range.start / binSize)
                 const startX =
                   (xScale(startBinIndex) || 0) +
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
index 7c2ecb89c..3f20344b8 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
@@ -28,7 +28,7 @@ const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRe
         label={`Repeat unit${(repeatUnitsByClassification as any).unknown.length > 1 ? 's' : ''}`}
       >
         <InlineList
-          items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: any) => (
+          items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: string) => (
             <span>
               {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
               shortTandemRepeat.repeat_units.length > 1
@@ -52,7 +52,7 @@ const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRe
           tooltip="These repeat units have been reported in the literature as pathogenic when they expand beyond a certain threshold."
         >
           <InlineList
-            items={(repeatUnitsByClassification as any).pathogenic.map((repeatUnit: any) => (
+            items={(repeatUnitsByClassification as any).pathogenic.map((repeatUnit: string) => (
               <span>
                 {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
                 shortTandemRepeat.repeat_units.length > 1
@@ -74,7 +74,7 @@ const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRe
           tooltip="These repeat units are regarded in the literature as benign, even when expanded."
         >
           <InlineList
-            items={(repeatUnitsByClassification as any).benign.map((repeatUnit: any) => (
+            items={(repeatUnitsByClassification as any).benign.map((repeatUnit: string) => (
               <span>
                 {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
                 shortTandemRepeat.repeat_units.length > 1
@@ -96,7 +96,7 @@ const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRe
           tooltip="These are the other repeat units detected at this locus within gnomAD samples by the call_non_ref_pathogenic_motifs.py script."
         >
           <InlineList
-            items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: any) => (
+            items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: string) => (
               <span>
                 {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
                 shortTandemRepeat.repeat_units.length > 1
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index 00ad37ee7..a813f1cf8 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -75,7 +75,9 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
               .flatMap(({ repeatUnits, distribution }) => [
                 {
                   repeatUnits,
-                  distribution: distribution.filter((d: any) => d[0] >= d[1]).filter(isInBin),
+                  distribution: distribution
+                    .filter((d) => d.long_allele_repunit_count >= d.short_allele_repunit_count)
+                    .filter(isInBin),
                 },
                 {
                   repeatUnits: [...repeatUnits].reverse(),
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 715b6b465..cbc20425c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -190,7 +190,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   Object.keys(allRepeatUnitsByClassification).forEach((classification) => {
     repeatUnitsFoundInGnomadByClassification[classification] = allRepeatUnitsByClassification[
       classification
-    ].filter((repeatUnit: any) => repeatUnitsFoundInGnomad.has(repeatUnit))
+    ].filter((repeatUnit) => repeatUnitsFoundInGnomad.has(repeatUnit))
   })
 
   const allRepeatUnitsFoundInGnomadArePathogenic = Object.keys(
@@ -319,7 +319,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             <Select
               id={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}
               value={selectedAlleleSizeRepeatUnit}
-              onChange={(e: any) => {
+              onChange={(e: { target: { value: string } }) => {
                 setSelectedAlleleSizeRepeatUnit(e.target.value)
               }}
             >
@@ -367,7 +367,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                           1
                         )}`}
                       >
-                        {allRepeatUnitsByClassification[classification].map((repeatUnit: any) => {
+                        {allRepeatUnitsByClassification[classification].map((repeatUnit) => {
                           const foundInGnomad = repeatUnitsFoundInGnomad.has(repeatUnit)
                           const notes = []
                           if (repeatUnit === shortTandemRepeat.reference_repeat_unit) {
@@ -397,7 +397,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             <Select
               id={`short-tandem-repeat-${shortTandemRepeat.id}-allele-size-distribution-scale`}
               value={selectedScaleType}
-              onChange={(e: any) => {
+              onChange={(e: { target: { value: ScaleType } }) => {
                 setSelectedScaleType(e.target.value)
               }}
             >
@@ -416,7 +416,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
               <Select
                 id={`short-tandem-repeat-${shortTandemRepeat.id}-allele-size-distribution-selected-disease`}
                 value={selectedDisease}
-                onChange={(e: any) => {
+                onChange={(e: { target: { value: string } }) => {
                   setSelectedDisease(e.target.value)
                 }}
               >
@@ -511,7 +511,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
               <Select
                 id={`short-tandem-repeat-${shortTandemRepeat.id}-genotype-distribution-selected-disease`}
                 value={selectedDisease}
-                onChange={(e: any) => {
+                onChange={(e: { target: { value: string } }) => {
                   setSelectedDisease(e.target.value)
                 }}
               >
@@ -541,7 +541,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
 
       {selectedGenotypeDistributionBin && (
         <Modal
-          title={(selectedGenotypeDistributionBin as any).label}
+          title={selectedGenotypeDistributionBin.label}
           size="large"
           // @ts-expect-error TS(2322) FIXME: Type '{ children: Element; title: any; size: "larg... Remove this comment to see the full error message
           initialFocusOnButton={false}
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 6e7b99abf..d2739abbd 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -165,17 +165,16 @@ export const getSelectedGenotypeDistribution = (
 }*/
 
 export const getGenotypeDistributionPlotAxisLabels = (
-  shortTandemRepeatOrAdjacentRepeat: any,
-  { selectedRepeatUnits }: any
+  shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
+  { selectedRepeatUnits }: { selectedRepeatUnits: string[] | '' }
 ) => {
-  if (selectedRepeatUnits) {
-    const repeatUnits = selectedRepeatUnits.split(' / ')
-    if (repeatUnits[0] === repeatUnits[1]) {
-      return shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units.length === 1
+  if (selectedRepeatUnits !== '') {
+    if (selectedRepeatUnits[0] === selectedRepeatUnits[1]) {
+      return genotypeRepunitPairs(shortTandemRepeatOrAdjacentRepeat).length === 1
         ? ['longer allele', 'shorter allele']
-        : [`longer ${repeatUnits[0]} allele`, `shorter ${repeatUnits[1]} allele`]
+        : [`longer ${selectedRepeatUnits[0]} allele`, `shorter ${selectedRepeatUnits[1]} allele`]
     }
-    return repeatUnits.map((repeatUnit: any) => `${repeatUnit} allele`)
+    return selectedRepeatUnits.map((repeatUnit) => `${repeatUnit} allele`)
   }
   return ['longer allele', 'shorter allele']
 }

From 390d8bbec7aad74cb7603049f5274d937cae71a8 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 26 Jul 2024 14:42:31 -0400
Subject: [PATCH 11/36] WIP update query in frontend

---
 .../ShortTandemRepeatPageContainer.tsx        | 118 ++++++++----------
 1 file changed, 54 insertions(+), 64 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
index ba8d0cd18..d76b291c1 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
@@ -15,23 +15,21 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
   short_tandem_repeat(id: $strId, dataset: $datasetId) {
     id
     gene {
-      ensembl_id
       symbol
-      region
     }
     associated_diseases {
-      name
-      symbol
       omim_id
-      inheritance_mode
-      repeat_size_classifications {
-        classification
-        min
-        max
-      }
       notes
     }
-    reference_region {
+    stripy_id
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -42,80 +40,72 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
       age_range
       distribution
     }
-    stripy_id
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
+    age_distribution {
+      age_range
+      distribution
+    }
   }
 }
 `

From a026ed8895f9ec52d76b9309f2e3ca2eff02bffd Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 26 Jul 2024 15:06:52 -0400
Subject: [PATCH 12/36] WIP restoring classification

---
 browser/src/GenePage/GenePageContainer.tsx    |  1 -
 .../src/RegionPage/RegionPageContainer.tsx    |  1 -
 ...tGenotypeDistributionRepeatUnitsSelect.tsx |  6 +-
 .../shortTandemRepeatHelpers.ts               | 88 +++++--------------
 4 files changed, 23 insertions(+), 73 deletions(-)

diff --git a/browser/src/GenePage/GenePageContainer.tsx b/browser/src/GenePage/GenePageContainer.tsx
index 6d0ecdb1b..313e223f7 100644
--- a/browser/src/GenePage/GenePageContainer.tsx
+++ b/browser/src/GenePage/GenePageContainer.tsx
@@ -263,7 +263,6 @@ query ${operationName}($geneId: String, $geneSymbol: String, $referenceGenome: R
   }
 }
 `
-// TK check
 type Props = {
   datasetId: DatasetId
   geneIdOrSymbol: string
diff --git a/browser/src/RegionPage/RegionPageContainer.tsx b/browser/src/RegionPage/RegionPageContainer.tsx
index e468a7268..c24eaf0f3 100644
--- a/browser/src/RegionPage/RegionPageContainer.tsx
+++ b/browser/src/RegionPage/RegionPageContainer.tsx
@@ -47,7 +47,6 @@ const query = `
     }
   }
 `
-// TK check
 type Props = {
   datasetId: DatasetId
   regionId: string
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
index 05a426835..951308a0a 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
@@ -2,7 +2,7 @@ import React, { Dispatch, SetStateAction } from 'react'
 
 import { Select } from '@gnomad/ui'
 import { ShortTandemRepeat, ShortTandemRepeatAdjacentRepeat } from './ShortTandemRepeatPage'
-import { genotypeRepunitPairs } from './shortTandemRepeatHelpers'
+import { genotypeRepunitPairs, isAdjacentRepeat } from './shortTandemRepeatHelpers'
 
 type Props = {
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
@@ -10,10 +10,6 @@ type Props = {
   setSelectedRepeatUnits: Dispatch<SetStateAction<string[] | ''>>
 }
 
-const isAdjacentRepeat = (
-  obj: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
-): obj is ShortTandemRepeatAdjacentRepeat => !obj.hasOwnProperty('associated_diseases')
-
 const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
   shortTandemRepeatOrAdjacentRepeat,
   selectedRepeatUnits,
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index d2739abbd..413444111 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -30,11 +30,26 @@ const addCohortToAlleleSizeDistribution = (
     return { ...acc, [repunit_count]: newItem }
   }, distribution)
 
+const repunitsWithClassification = (
+  shortTandemRepeat: ShortTandemRepeat,
+  targetClassification: string
+): Set<string> =>
+  shortTandemRepeat.repeat_units.reduce(
+    (acc, repunit) =>
+      repunit.classification === targetClassification ? acc.add(repunit.repeat_unit) : acc,
+    new Set<string>()
+  )
+
 export const getSelectedAlleleSizeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
   { selectedAncestryGroup, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
 ): AlleleSizeDistributionItem[] => {
-  // TK figure out what's up with classification
+  const matchingRepunits: Set<string> =
+    selectedRepeatUnit.startsWith('classification') &&
+    !isAdjacentRepeat(shortTandemRepeatOrAdjacentRepeat)
+      ? repunitsWithClassification(shortTandemRepeatOrAdjacentRepeat, selectedRepeatUnit.slice(15))
+      : new Set([selectedRepeatUnit])
+
   const itemsByRepunitCount: Record<number, AlleleSizeDistributionItem> =
     shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.reduce((acc, cohort) => {
       if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {
@@ -43,58 +58,14 @@ export const getSelectedAlleleSizeDistribution = (
       if (selectedSex !== '' && cohort.sex !== selectedSex) {
         return acc
       }
-      if (cohort.repunit !== selectedRepeatUnit) {
+
+      if (!matchingRepunits.has(cohort.repunit)) {
         return acc
       }
       return addCohortToAlleleSizeDistribution(cohort, acc)
     }, {} as Record<number, AlleleSizeDistributionItem>)
   return Object.values(itemsByRepunitCount)
 }
-/*  if (selectedRepeatUnit) {
-    // Repeat units grouped by classification are not valid for adjacent repeats.
-    if (selectedRepeatUnit.startsWith('classification')) {
-      const selectedClassification = selectedRepeatUnit.slice(15)
-
-      const repeatUnitClassification = shortTandemRepeatOrAdjacentRepeat.repeat_units.reduce(
-        (acc, repeatUnit) => ({
-          ...acc,
-          [repeatUnit.repeat_unit]: repeatUnit.classification,
-        }),
-        {}
-      )
-
-      const repeatUnits =
-        shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.repeat_units.filter(
-          (r: any) => repeatUnitClassification[r.repeat_unit] === selectedClassification
-        )
-
-      const distributions = repeatUnits.map(
-        selectedPopulationId
-          ? (r: any) =>
-              r.populations.find((pop: any) => pop.id === selectedPopulationId).distribution
-          : (r: any) => r.distribution
-      )
-
-      return sumDistributions(distributions)
-    }
-
-    const repeatUnit = shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.repeat_units.find(
-      (r: any) => r.repeat_unit === selectedRepeatUnit
-    )
-    if (selectedPopulationId) {
-      return repeatUnit.populations.find((pop: any) => pop.id === selectedPopulationId).distribution
-    }
-    return repeatUnit.distribution
-  }
-
-  if (selectedPopulationId) {
-    return shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.populations.find(
-      (pop: any) => pop.id === selectedPopulationId
-    ).distribution
-  }
-
-  return shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.distribution
-}*/
 
 const addCohortToGenotypeDistribution = (
   cohort: GenotypeDistributionCohort,
@@ -145,25 +116,6 @@ export const getSelectedGenotypeDistribution = (
   return Object.values(itemsByRepunitCounts)
 }
 
-/* {
-  const baseDistribution = selectedRepeatUnits
-    ? shortTandemRepeatOrAdjacentRepeat.genotype_distribution.repeat_units.find(
-        (repeatUnit: any) => repeatUnit.repeat_units.join(' / ') === selectedRepeatUnits
-      )
-    : shortTandemRepeatOrAdjacentRepeat.genotype_distribution
-
-  const selectedDistribution =
-    selectedPopulationId === ''
-      ? baseDistribution.distribution
-      : baseDistribution.populations.find((pop: any) => pop.id === selectedPopulationId)
-          .distribution
-
-  return !selectedRepeatUnits ||
-    selectedRepeatUnits.split(' / ')[0] === selectedRepeatUnits.split(' / ')[1]
-    ? selectedDistribution.map((d: any) => (d[0] >= d[1] ? d : [d[1], d[0], d[2]]))
-    : selectedDistribution
-}*/
-
 export const getGenotypeDistributionPlotAxisLabels = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
   { selectedRepeatUnits }: { selectedRepeatUnits: string[] | '' }
@@ -217,3 +169,7 @@ export const genotypeRepunitPairs = (
     (a, b) => a[0].localeCompare(b[0]) || a[1].localeCompare(b[1])
   )
 }
+
+export const isAdjacentRepeat = (
+  obj: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
+): obj is ShortTandemRepeatAdjacentRepeat => !obj.hasOwnProperty('associated_diseases')

From 006a3f3ae3bdb5c1d1938b418bb7b0bece40b1cd Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 26 Jul 2024 15:33:37 -0400
Subject: [PATCH 13/36] WIP fixing query

---
 .../ShortTandemRepeatPageContainer.tsx           | 16 +++++++++++-----
 1 file changed, 11 insertions(+), 5 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
index d76b291c1..210a7bccf 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
@@ -15,13 +15,22 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
   short_tandem_repeat(id: $strId, dataset: $datasetId) {
     id
     gene {
+      ensembl_id
       symbol
+      region
     }
     associated_diseases {
+      name
+      symbol
       omim_id
+      inheritance_mode
+      repeat_size_classifications {
+        classification
+        min
+        max
+      }
       notes
     }
-    stripy_id
     main_reference_region {
       reference_genome
       chrom
@@ -67,6 +76,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       age_range
       distribution
     }
+    stripy_id
     adjacent_repeats {
       id
       reference_region {
@@ -102,10 +112,6 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
         frequency
       }
     }
-    age_distribution {
-      age_range
-      distribution
-    }
   }
 }
 `

From 6facef11a42406865c0e9656b3ca5d8210411de8 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 26 Jul 2024 15:54:44 -0400
Subject: [PATCH 14/36] DONTMERGE nerf reads

---
 browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
index a874706dd..fd93fb410 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
@@ -203,6 +203,9 @@ const ShortTandemRepeatReads = ({
   shortTandemRepeat,
   filter,
 }: ShortTandemRepeatReadsProps) => {
+  if (2 + 2 === 4) {
+    return <StatusMessage>TK fix reads</StatusMessage>
+  }
   const fetchReadsTimer = useRef<ReturnType<typeof setTimeout> | null>(null)
   const fetchNumReadsMemoized = useCallback(() => {
     if (fetchReadsTimer.current) {

From 246b989927b42cc21d70e99e99efc433c1735c25 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 29 Jul 2024 11:33:56 -0400
Subject: [PATCH 15/36] fixup fix ancestry and sex selectors

---
 .../ShortTandemRepeatPopulationOptions.tsx                  | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index 94810daae..9545c9f7d 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -51,7 +51,9 @@ const ShortTandemRepeatPopulationOptions = ({
         <Select
           id={`short-tandem-repeat-${id}-population-options-population`}
           value={selectedAncestryGroup}
-          onChange={setSelectedAncestryGroup}
+          onChange={(e: { target: { value: AncestryGroupId | '' } }) =>
+            setSelectedAncestryGroup(e.target.value)
+          }
         >
           <option value="">Global</option>
           {ancestryGroupsSortedByName.map((ancestryGroup) => (
@@ -67,7 +69,7 @@ const ShortTandemRepeatPopulationOptions = ({
         <Select
           id={`short-tandem-repeat-${id}-population-options-sex`}
           value={selectedSex}
-          onChange={setSelectedSex}
+          onChange={(e: { target: { value: Sex | '' } }) => setSelectedSex(e.target.value)}
         >
           <option value="">All</option>
           <option value="XX">XX</option>

From 72f3713a5aabf571b33b2dfdd3aed6490e01607e Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 29 Jul 2024 11:47:25 -0400
Subject: [PATCH 16/36] fixup: fix allele size plot when no selected repunit

---
 browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 413444111..61ce2f7fb 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -59,7 +59,7 @@ export const getSelectedAlleleSizeDistribution = (
         return acc
       }
 
-      if (!matchingRepunits.has(cohort.repunit)) {
+      if (selectedRepeatUnit !== '' && !matchingRepunits.has(cohort.repunit)) {
         return acc
       }
       return addCohortToAlleleSizeDistribution(cohort, acc)

From c43690f41a54c5c5191f06f5f7e6ee3bc358f17e Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 10 Oct 2024 19:41:37 -0400
Subject: [PATCH 17/36] misc. updates to TR page in preparation for new release

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx |   1 -
 .../ShortTandemRepeatAttributes.tsx           | 157 +++++++++++-------
 ...tGenotypeDistributionRepeatUnitsSelect.tsx |   5 +-
 .../ShortTandemRepeatPage.tsx                 | 151 +++++++++--------
 .../ShortTandemRepeatPopulationOptions.tsx    |  14 +-
 .../ShortTandemRepeatReads.tsx                |  58 ++++---
 6 files changed, 214 insertions(+), 172 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 755f946b7..1b24f620c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -91,7 +91,6 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
 
       return d
     }, [alleleSizeDistribution, nBins, binSize])
-
     const xScale = scaleBand<number>()
       .domain(data.map((d) => d.binIndex))
       .range([0, plotWidth])
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
index 3f20344b8..764772677 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAttributes.tsx
@@ -42,76 +42,109 @@ const ShortTandemRepeatRepeatUnits = ({ shortTandemRepeat }: ShortTandemRepeatRe
     )
   }
 
-  return (
-    <>
-      {(repeatUnitsByClassification as any).pathogenic && (
-        <AttributeListItem
-          label={`Pathogenic repeat unit${
-            (repeatUnitsByClassification as any).pathogenic.length > 1 ? 's' : ''
-          }`}
-          tooltip="These repeat units have been reported in the literature as pathogenic when they expand beyond a certain threshold."
-        >
-          <InlineList
-            items={(repeatUnitsByClassification as any).pathogenic.map((repeatUnit: string) => (
-              <span>
-                {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
-                shortTandemRepeat.repeat_units.length > 1
-                  ? `${repeatUnit} (reference)`
-                  : repeatUnit}
-              </span>
-            ))}
+  if (
+    (repeatUnitsByClassification as any).pathogenic &&
+    (repeatUnitsByClassification as any).pathogenic.length == 1 &&
+    !(repeatUnitsByClassification as any).benign &&
+    !(repeatUnitsByClassification as any).unknown
+  ) {
+    return (
+      <>
+        {(repeatUnitsByClassification as any).pathogenic && (
+          <AttributeListItem
+            label={`Repeat unit${
+              (repeatUnitsByClassification as any).pathogenic.length > 1 ? 's' : ''
+            }`}
+          >
+            <InlineList
+              items={(repeatUnitsByClassification as any).pathogenic.map((repeatUnit: string) => (
+                <span>
+                  {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
+                  shortTandemRepeat.repeat_units.length > 1
+                    ? `${repeatUnit} (reference)`
+                    : repeatUnit}
+                </span>
+              ))}
+              label={`Pathogenic repeat unit${
+                (repeatUnitsByClassification as any).pathogenic.length > 1 ? 's' : ''
+              }`}
+            />
+          </AttributeListItem>
+        )}
+      </>
+    )
+  } else {
+    return (
+      <>
+        {(repeatUnitsByClassification as any).pathogenic && (
+          <AttributeListItem
             label={`Pathogenic repeat unit${
               (repeatUnitsByClassification as any).pathogenic.length > 1 ? 's' : ''
             }`}
-          />
-        </AttributeListItem>
-      )}
-      {(repeatUnitsByClassification as any).benign && (
-        <AttributeListItem
-          label={`Benign repeat unit${
-            (repeatUnitsByClassification as any).benign.length > 1 ? 's' : ''
-          }`}
-          tooltip="These repeat units are regarded in the literature as benign, even when expanded."
-        >
-          <InlineList
-            items={(repeatUnitsByClassification as any).benign.map((repeatUnit: string) => (
-              <span>
-                {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
-                shortTandemRepeat.repeat_units.length > 1
-                  ? `${repeatUnit} (reference)`
-                  : repeatUnit}
-              </span>
-            ))}
+            tooltip="These repeat units have been reported in the literature as pathogenic when they expand beyond a certain threshold."
+          >
+            <InlineList
+              items={(repeatUnitsByClassification as any).pathogenic.map((repeatUnit: string) => (
+                <span>
+                  {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
+                  shortTandemRepeat.repeat_units.length > 1
+                    ? `${repeatUnit} (reference)`
+                    : repeatUnit}
+                </span>
+              ))}
+              label={`Pathogenic repeat unit${
+                (repeatUnitsByClassification as any).pathogenic.length > 1 ? 's' : ''
+              }`}
+            />
+          </AttributeListItem>
+        )}
+        {(repeatUnitsByClassification as any).benign && (
+          <AttributeListItem
             label={`Benign repeat unit${
               (repeatUnitsByClassification as any).benign.length > 1 ? 's' : ''
             }`}
-          />
-        </AttributeListItem>
-      )}
-      {(repeatUnitsByClassification as any).unknown && (
-        <AttributeListItem
-          label={`Other repeat unit${
-            (repeatUnitsByClassification as any).unknown.length > 1 ? 's' : ''
-          }`}
-          tooltip="These are the other repeat units detected at this locus within gnomAD samples by the call_non_ref_pathogenic_motifs.py script."
-        >
-          <InlineList
-            items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: string) => (
-              <span>
-                {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
-                shortTandemRepeat.repeat_units.length > 1
-                  ? `${repeatUnit} (reference)`
-                  : repeatUnit}
-              </span>
-            ))}
+            tooltip="These repeat units are regarded in the literature as benign, even when expanded."
+          >
+            <InlineList
+              items={(repeatUnitsByClassification as any).benign.map((repeatUnit: string) => (
+                <span>
+                  {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
+                  shortTandemRepeat.repeat_units.length > 1
+                    ? `${repeatUnit} (reference)`
+                    : repeatUnit}
+                </span>
+              ))}
+              label={`Benign repeat unit${
+                (repeatUnitsByClassification as any).benign.length > 1 ? 's' : ''
+              }`}
+            />
+          </AttributeListItem>
+        )}
+        {(repeatUnitsByClassification as any).unknown && (
+          <AttributeListItem
             label={`Other repeat unit${
               (repeatUnitsByClassification as any).unknown.length > 1 ? 's' : ''
             }`}
-          />
-        </AttributeListItem>
-      )}
-    </>
-  )
+            tooltip="These are the other repeat units detected at this locus within gnomAD samples by the call_non_ref_pathogenic_motifs.py script."
+          >
+            <InlineList
+              items={(repeatUnitsByClassification as any).unknown.map((repeatUnit: string) => (
+                <span>
+                  {repeatUnit === shortTandemRepeat.reference_repeat_unit &&
+                  shortTandemRepeat.repeat_units.length > 1
+                    ? `${repeatUnit} (reference)`
+                    : repeatUnit}
+                </span>
+              ))}
+              label={`Other repeat unit${
+                (repeatUnitsByClassification as any).unknown.length > 1 ? 's' : ''
+              }`}
+            />
+          </AttributeListItem>
+        )}
+      </>
+    )
+  }
 }
 
 type ShortTandemRepeatAttributesProps = {
@@ -131,7 +164,7 @@ const ShortTandemRepeatAttributes = ({ shortTandemRepeat }: ShortTandemRepeatAtt
         <Link
           to={`/region/${shortTandemRepeat.main_reference_region.chrom}-${shortTandemRepeat.main_reference_region.start}-${shortTandemRepeat.main_reference_region.stop}`}
         >
-          {shortTandemRepeat.main_reference_region.chrom}-
+          {shortTandemRepeat.main_reference_region.chrom}:
           {shortTandemRepeat.main_reference_region.start}-
           {shortTandemRepeat.main_reference_region.stop}
         </Link>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
index 951308a0a..55e4f1294 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect.tsx
@@ -27,6 +27,9 @@ const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
 
   const repunitPairs = genotypeRepunitPairs(shortTandemRepeatOrAdjacentRepeat)
 
+  if (repunitPairs.length == 1) {
+    return null
+  }
   return (
     <label
       htmlFor={`short-tandem-repeat-${shortTandemRepeatOrAdjacentRepeat.id}-genotype-distribution-repeat-units`}
@@ -40,7 +43,7 @@ const ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect = ({
           setSelectedRepeatUnits(newPair)
         }}
       >
-        {repunitPairs.length > 1 && <option value="">All</option>}
+        <option value="">All</option>
         <optgroup label="Repeat unit pairs (only pairs found in gnomAD are listed here)">
           {repunitPairs.map((pair) => {
             return (
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index cbc20425c..5e6069dea 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -258,12 +258,20 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                     STRipy
                   </ExternalLink>
                 </ListItem>
+                <ListItem>
+                  {/* @ts-expect-error TS(2786) FIXME: 'ExternalLink' cannot be used as a JSX component. */}
+                  <ExternalLink
+                    href={`https://strchive.org/database/${shortTandemRepeat.stripy_id}.html`}
+                  >
+                    STRchive
+                  </ExternalLink>
+                </ListItem>
               </List>
             </>
           )}
-          <h2>Related Loci</h2>
+          <h2>TRs in gnomAD</h2>
           <p>
-            <Link to="/short-tandem-repeats">Table of tandem repeat loci in gnomAD</Link>
+            <Link to="/short-tandem-repeats">Known disease-associated TRs </Link>
           </p>
         </ResponsiveSection>
       </FlexWrapper>
@@ -314,81 +322,70 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             setSelectedSex={setSelectedSex}
           />
 
-          <label htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}>
-            Repeat unit: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
-            <Select
-              id={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}
-              value={selectedAlleleSizeRepeatUnit}
-              onChange={(e: { target: { value: string } }) => {
-                setSelectedAlleleSizeRepeatUnit(e.target.value)
-              }}
-            >
-              {alleleSizeDistributionRepunits.length === 1 ? (
-                <option
-                  key={alleleSizeDistributionRepunits[0]}
-                  value={alleleSizeDistributionRepunits[0]}
-                >
-                  {alleleSizeDistributionRepunits[0]}
-                </option>
-              ) : (
-                <>
-                  <option value="">All</option>
-                  {Object.keys(allRepeatUnitsByClassification).length > 1 && (
-                    <>
-                      <optgroup label="Grouped by classification">
-                        {['pathogenic', 'benign', 'unknown'].map((classification) => {
-                          const foundInGnomad =
-                            (repeatUnitsFoundInGnomadByClassification[classification] || [])
-                              .length > 0
-                          return (
-                            <option
-                              key={classification}
-                              value={`classification/${classification}`}
-                              disabled={!foundInGnomad}
-                            >
-                              {foundInGnomad
-                                ? `All ${classification}`
-                                : `All ${classification} (not found in gnomAD)`}
-                            </option>
-                          )
-                        })}
-                      </optgroup>
-                    </>
-                  )}
-                  {['pathogenic', 'benign', 'unknown']
-                    .filter(
-                      (classification) =>
-                        (allRepeatUnitsByClassification[classification] || []).length > 0
-                    )
-                    .map((classification) => (
-                      <optgroup
-                        key={classification}
-                        label={`${classification.charAt(0).toUpperCase()}${classification.slice(
-                          1
-                        )}`}
-                      >
-                        {allRepeatUnitsByClassification[classification].map((repeatUnit) => {
-                          const foundInGnomad = repeatUnitsFoundInGnomad.has(repeatUnit)
-                          const notes = []
-                          if (repeatUnit === shortTandemRepeat.reference_repeat_unit) {
-                            notes.push('reference')
-                          }
-                          if (!foundInGnomad) {
-                            notes.push('not found in gnomAD')
-                          }
-                          return (
-                            <option key={repeatUnit} value={repeatUnit} disabled={!foundInGnomad}>
-                              {repeatUnit}
-                              {notes.length > 0 && ` (${notes.join(', ')})`}
-                            </option>
-                          )
-                        })}
-                      </optgroup>
-                    ))}
-                </>
-              )}
-            </Select>
-          </label>
+          {alleleSizeDistributionRepunits.length > 1 && (
+            <label htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}>
+              Repeat unit: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
+              <Select
+                id={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}
+                value={selectedAlleleSizeRepeatUnit}
+                onChange={(e: { target: { value: string } }) => {
+                  setSelectedAlleleSizeRepeatUnit(e.target.value)
+                }}
+              >
+                <option value="">All</option>
+                {Object.keys(allRepeatUnitsByClassification).length > 1 && (
+                  <>
+                    <optgroup label="Grouped by classification">
+                      {['pathogenic', 'benign', 'unknown'].map((classification) => {
+                        const foundInGnomad =
+                          (repeatUnitsFoundInGnomadByClassification[classification] || []).length >
+                          0
+                        return (
+                          <option
+                            key={classification}
+                            value={`classification/${classification}`}
+                            disabled={!foundInGnomad}
+                          >
+                            {foundInGnomad
+                              ? `All ${classification}`
+                              : `All ${classification} (not found in gnomAD)`}
+                          </option>
+                        )
+                      })}
+                    </optgroup>
+                  </>
+                )}
+                {['pathogenic', 'benign', 'unknown']
+                  .filter(
+                    (classification) =>
+                      (allRepeatUnitsByClassification[classification] || []).length > 0
+                  )
+                  .map((classification) => (
+                    <optgroup
+                      key={classification}
+                      label={`${classification.charAt(0).toUpperCase()}${classification.slice(1)}`}
+                    >
+                      {allRepeatUnitsByClassification[classification].map((repeatUnit) => {
+                        const foundInGnomad = repeatUnitsFoundInGnomad.has(repeatUnit)
+                        const notes = []
+                        if (repeatUnit === shortTandemRepeat.reference_repeat_unit) {
+                          notes.push('reference')
+                        }
+                        if (!foundInGnomad) {
+                          notes.push('not found in gnomAD')
+                        }
+                        return (
+                          <option key={repeatUnit} value={repeatUnit} disabled={!foundInGnomad}>
+                            {repeatUnit}
+                            {notes.length > 0 && ` (${notes.join(', ')})`}
+                          </option>
+                        )
+                      })}
+                    </optgroup>
+                  ))}
+              </Select>
+            </label>
+          )}
 
           <label
             htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-allele-size-distribution-scale`}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index 9545c9f7d..96101dcde 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -22,6 +22,10 @@ const Wrapper = styled.div`
   }
 `
 
+const Label = styled.label`
+  padding-right: 1em;
+`
+
 type Props = {
   id: string
   ancestryGroups: AncestryGroupId[]
@@ -45,8 +49,8 @@ const ShortTandemRepeatPopulationOptions = ({
 
   return (
     <Wrapper>
-      <label htmlFor={`short-tandem-repeat-${id}-population-options-population`}>
-        Genetic ancestry group:{' '}
+      <Label htmlFor={`short-tandem-repeat-${id}-population-options-population`}>
+        Genetic ancestry group: &nbsp;
         {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
         <Select
           id={`short-tandem-repeat-${id}-population-options-population`}
@@ -62,9 +66,9 @@ const ShortTandemRepeatPopulationOptions = ({
             </option>
           ))}
         </Select>
-      </label>
+      </Label>
 
-      <label htmlFor={`short-tandem-repeat-${id}-population-options-sex`}>
+      <Label htmlFor={`short-tandem-repeat-${id}-population-options-sex`}>
         Sex: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
         <Select
           id={`short-tandem-repeat-${id}-population-options-sex`}
@@ -75,7 +79,7 @@ const ShortTandemRepeatPopulationOptions = ({
           <option value="XX">XX</option>
           <option value="XY">XY</option>
         </Select>
-      </label>
+      </Label>
     </Wrapper>
   )
 }
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
index fd93fb410..b36bbab57 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
@@ -340,6 +340,9 @@ const ShortTandemRepeatReadsAllelesFilterControlWrapper = styled.div`
     width: 12ch;
   }
 `
+const Label = styled.label`
+  padding-right: 1em;
+`
 
 type ShortTandemRepeatReadsAllelesFilterControlsProps = {
   shortTandemRepeat: ShortTandemRepeat
@@ -363,30 +366,33 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
     <ShortTandemRepeatReadsAllelesFilterControlsWrapper>
       {[0, 1].map((alleleIndex) => (
         <ShortTandemRepeatReadsAllelesFilterControlWrapper key={`${alleleIndex}`}>
-          Allele {alleleIndex + 1}: {/* eslint-disable jsx-a11y/label-has-associated-control */}
-          <label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-repeat-unit`}>
-            Repeat unit {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
-            <Select
-              id={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-repeat-unit`}
-              value={value[alleleIndex].repeat_unit || ''}
-              onChange={(e: any) => {
-                const newRepeatUnit = e.target.value
-                onChange(
-                  value.map((v, i) =>
-                    i === alleleIndex ? { ...v, repeat_unit: newRepeatUnit } : v
+          Allele {alleleIndex + 1}: &nbsp;{' '}
+          {/* eslint-disable jsx-a11y/label-has-associated-control */}
+          {alleleSizeDistributionRepeatUnits.length > 1 && (
+            <Label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-repeat-unit`}>
+              Repeat unit {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
+              <Select
+                id={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-repeat-unit`}
+                value={value[alleleIndex].repeat_unit || ''}
+                onChange={(e: any) => {
+                  const newRepeatUnit = e.target.value
+                  onChange(
+                    value.map((v, i) =>
+                      i === alleleIndex ? { ...v, repeat_unit: newRepeatUnit } : v
+                    )
                   )
-                )
-              }}
-            >
-              {alleleSizeDistributionRepeatUnits.length > 1 && <option value="">Any</option>}
-              {alleleSizeDistributionRepeatUnits.map((repeatUnit) => (
-                <option key={repeatUnit} value={repeatUnit}>
-                  {repeatUnit}
-                </option>
-              ))}
-            </Select>
-          </label>{' '}
-          <label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-min-repeats`}>
+                }}
+              >
+                {alleleSizeDistributionRepeatUnits.length > 1 && <option value="">Any</option>}
+                {alleleSizeDistributionRepeatUnits.map((repeatUnit) => (
+                  <option key={repeatUnit} value={repeatUnit}>
+                    {repeatUnit}
+                  </option>
+                ))}
+              </Select>
+            </Label>
+          )}
+          <Label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-min-repeats`}>
             Min repeats {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
             <Input
               type="number"
@@ -403,8 +409,8 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
                 )
               }}
             />
-          </label>{' '}
-          <label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-max-repeats`}>
+          </Label>{' '}
+          <Label htmlFor={`short-tandem-repeat-reads-filter-allele-${alleleIndex}-max-repeats`}>
             Max repeats {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
             <Input
               type="number"
@@ -421,7 +427,7 @@ const ShortTandemRepeatReadsAllelesFilterControls = ({
                 )
               }}
             />
-          </label>
+          </Label>
           {/* eslint-enable jsx-a11y/label-has-associated-control */}
         </ShortTandemRepeatReadsAllelesFilterControlWrapper>
       ))}

From c28caaed2d68382eaa82c9a9d91f8ee20fa6709b Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Wed, 30 Oct 2024 13:19:45 -0400
Subject: [PATCH 18/36] renamed 'AncestryGroup' to 'Population' and 'frequency'
 to 'count'

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx | 32 ++++++-------
 ...TandemRepeatAlleleSizeDistributionPlot.tsx |  4 +-
 ...emRepeatGenotypeDistributionBinDetails.tsx | 22 +++++----
 ...rtTandemRepeatGenotypeDistributionPlot.tsx |  6 +--
 .../ShortTandemRepeatPage.tsx                 | 48 ++++++++++---------
 .../ShortTandemRepeatPageContainer.tsx        |  8 ++--
 .../ShortTandemRepeatPopulationOptions.tsx    | 35 +++++++-------
 .../ShortTandemRepeatReads.tsx                |  7 +--
 .../shortTandemRepeatHelpers.ts               | 28 ++++++-----
 9 files changed, 99 insertions(+), 91 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 921dadb9d..373cb72a8 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -19,30 +19,30 @@ import {
   maxAlleleSizeDistributionRepeats,
   maxGenotypeDistributionRepeats,
 } from './shortTandemRepeatHelpers'
-import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 import { Bin as GenotypeBin } from './ShortTandemRepeatGenotypeDistributionPlot'
 
 type Props = {
   adjacentRepeat: ShortTandemRepeatAdjacentRepeat
   selectedScaleType: ScaleType
-  selectedAncestryGroup: AncestryGroupId | ''
+  selectedPopulation: PopulationId | ''
   selectedSex: Sex | ''
-  ancestryGroups: AncestryGroupId[]
+  populations: PopulationId[]
   selectedGenotypeDistributionBin: GenotypeBin | null
   setSelectedGenotypeDistributionBin: Dispatch<SetStateAction<GenotypeBin | null>>
   setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
-  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId | ''>>
+  setSelectedPopulation: Dispatch<SetStateAction<PopulationId | ''>>
   setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
 }
 
 const ShortTandemRepeatAdjacentRepeatSection = ({
   adjacentRepeat,
-  ancestryGroups,
+  populations,
   selectedScaleType,
-  selectedAncestryGroup,
+  selectedPopulation,
   selectedSex,
   setSelectedScaleType,
-  setSelectedAncestryGroup,
+  setSelectedPopulation,
   setSelectedSex,
 }: Props) => {
   const [selectedRepeatUnit, setSelectedRepeatUnit] = useState(
@@ -67,7 +67,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
       <ShortTandemRepeatAlleleSizeDistributionPlot
         maxRepeats={maxAlleleSizeDistributionRepeats(adjacentRepeat)}
         alleleSizeDistribution={getSelectedAlleleSizeDistribution(adjacentRepeat, {
-          selectedAncestryGroup,
+          selectedPopulation,
           selectedSex,
           selectedRepeatUnit,
         })}
@@ -77,10 +77,10 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
       <ControlSection>
         <ShortTandemRepeatPopulationOptions
           id={`${adjacentRepeat.id}-repeat-counts`}
-          ancestryGroups={ancestryGroups}
-          selectedAncestryGroup={selectedAncestryGroup}
+          populations={populations}
+          selectedPopulation={selectedPopulation}
           selectedSex={selectedSex}
-          setSelectedAncestryGroup={setSelectedAncestryGroup}
+          setSelectedPopulation={setSelectedPopulation}
           setSelectedSex={setSelectedSex}
         />
 
@@ -128,7 +128,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
         maxRepeats={maxGenotypeDistributionRepeats(adjacentRepeat)}
         genotypeDistribution={getSelectedGenotypeDistribution(adjacentRepeat, {
           selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
-          selectedAncestryGroup: selectedAncestryGroup,
+          selectedPopulation: selectedPopulation,
           selectedSex: selectedSex,
         })}
         onSelectBin={(bin: GenotypeBin) => {
@@ -143,10 +143,10 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
       <ControlSection>
         <ShortTandemRepeatPopulationOptions
           id={`${adjacentRepeat.id}-genotype-distribution`}
-          ancestryGroups={ancestryGroups}
-          selectedAncestryGroup={selectedAncestryGroup}
+          populations={populations}
+          selectedPopulation={selectedPopulation}
           selectedSex={selectedSex}
-          setSelectedAncestryGroup={setSelectedAncestryGroup}
+          setSelectedPopulation={setSelectedPopulation}
           setSelectedSex={setSelectedSex}
         />
 
@@ -171,7 +171,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
             shortTandemRepeatOrAdjacentRepeat={adjacentRepeat}
             selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
             bin={selectedGenotypeDistributionBin}
-            selectedAncestryGroup={selectedAncestryGroup}
+            selectedPopulation={selectedPopulation}
             selectedSex={selectedSex}
             repeatUnitPairs={genotypeDistributionPairs}
           />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 1b24f620c..d4899af45 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -84,9 +84,9 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
         count: 0,
       }))
 
-      alleleSizeDistribution.forEach(({ repunit_count, frequency }) => {
+      alleleSizeDistribution.forEach(({ repunit_count, allele_count }) => {
         const binIndex = Math.floor(repunit_count / binSize)
-        d[binIndex].count += frequency
+        d[binIndex].count += allele_count
       })
 
       return d
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index a813f1cf8..3890dec1f 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -9,11 +9,11 @@ import {
   GenotypeDistributionItem,
 } from './ShortTandemRepeatPage'
 import { getSelectedGenotypeDistribution } from './shortTandemRepeatHelpers'
-import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 type Props = {
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
-  selectedAncestryGroup: AncestryGroupId | ''
+  selectedPopulation: PopulationId | ''
   selectedSex: Sex | ''
   selectedRepeatUnits: string[] | ''
   repeatUnitPairs: string[][]
@@ -26,14 +26,14 @@ type Props = {
 
 const ShortTandemRepeatGenotypeDistributionBinDetails = ({
   shortTandemRepeatOrAdjacentRepeat,
-  selectedAncestryGroup,
+  selectedPopulation,
   selectedSex,
   selectedRepeatUnits,
   repeatUnitPairs,
   bin,
 }: Props) => {
   const genotypeDistribution = getSelectedGenotypeDistribution(shortTandemRepeatOrAdjacentRepeat, {
-    selectedAncestryGroup,
+    selectedPopulation,
     selectedRepeatUnits,
     selectedSex,
   })
@@ -50,11 +50,11 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
       <List>
         {genotypeDistribution
           .filter(isInBin)
-          .map(({ long_allele_repunit_count, short_allele_repunit_count, frequency }) => (
+          .map(({ long_allele_repunit_count, short_allele_repunit_count, genotype_count }) => (
             // @ts-expect-error TS(2769) FIXME: No overload matches this call.
             <ListItem key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}>
               {long_allele_repunit_count} repeats / {short_allele_repunit_count} repeats:{' '}
-              {frequency} individuals
+              {genotype_count} individuals
             </ListItem>
           ))}
       </List>
@@ -67,7 +67,7 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
               .map((repeatUnits) => ({
                 repeatUnits,
                 distribution: getSelectedGenotypeDistribution(shortTandemRepeatOrAdjacentRepeat, {
-                  selectedAncestryGroup,
+                  selectedPopulation,
                   selectedSex,
                   selectedRepeatUnits: repeatUnits,
                 }),
@@ -98,13 +98,17 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
                   {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
                   <List>
                     {distribution.map(
-                      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => (
+                      ({
+                        short_allele_repunit_count,
+                        long_allele_repunit_count,
+                        genotype_count,
+                      }) => (
                         // @ts-expect-error TS(2769) FIXME: No overload matches this call.
                         <ListItem
                           key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}
                         >
                           {long_allele_repunit_count} repeats / {short_allele_repunit_count}{' '}
-                          repeats: {frequency} individuals
+                          repeats: {genotype_count} individuals
                         </ListItem>
                       )
                     )}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
index cf4269fd6..69fd8d07d 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
@@ -104,10 +104,10 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     })
 
     genotypeDistribution.forEach(
-      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => {
+      ({ short_allele_repunit_count, long_allele_repunit_count, genotype_count }) => {
         const xBinIndex = Math.floor(short_allele_repunit_count / xBinSize)
         const yBinIndex = Math.floor(long_allele_repunit_count / yBinSize)
-        data[xBinIndex * yNumBins + yBinIndex].count += frequency
+        data[xBinIndex * yNumBins + yBinIndex].count += genotype_count
       }
     )
 
@@ -145,7 +145,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     }
 
     const opacityScale = scaleLog()
-      .domain([1, max(genotypeDistribution, (d) => d.frequency) || 2])
+      .domain([1, max(genotypeDistribution, (d) => d.genotype_count) || 2])
       .range([0.1, 1])
 
     return (
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 5e6069dea..aff7f8c49 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -29,7 +29,7 @@ import {
   genotypeRepunitPairs,
 } from './shortTandemRepeatHelpers'
 import ShortTandemRepeatAdjacentRepeatSection from './ShortTandemRepeatAdjacentRepeatSection'
-import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 type ShortTandemRepeatReferenceRegion = {
   chrom: string
@@ -37,15 +37,18 @@ type ShortTandemRepeatReferenceRegion = {
   stop: number
 }
 
+export type GenotypeQuality = 'low' | 'medium-low' | 'medium' | 'medium-high' | 'high'
+
 export type AlleleSizeDistributionItem = {
   repunit_count: number
-  frequency: number
+  allele_count: number
+  manual_genotype_quality: GenotypeQuality
 }
 
 export type Sex = 'XX' | 'XY'
 
 export type AlleleSizeDistributionCohort = {
-  ancestry_group: AncestryGroupId
+  ancestry_group: PopulationId
   sex: Sex
   repunit: string
   quality_description: string
@@ -56,7 +59,7 @@ export type AlleleSizeDistributionCohort = {
 export type GenotypeDistributionItem = {
   short_allele_repunit_count: number
   long_allele_repunit_count: number
-  frequency: number
+  genotype_count: number
 }
 
 export type GenotypeDistributionCohort = {
@@ -158,7 +161,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     genotypeDistributionRepunitPairs.length === 1 ? genotypeDistributionRepunitPairs[0] : ''
   const defaultDisease = shortTandemRepeat.associated_diseases[0].name
 
-  const [selectedAncestryGroup, setSelectedAncestryGroup] = useState<AncestryGroupId | ''>('')
+  const [selectedPopulation, setSelectedPopulation] = useState<PopulationId | ''>('')
   const [selectedSex, setSelectedSex] = useState<Sex | ''>('')
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
@@ -168,7 +171,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
   const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
   const [showAdjacentRepeats, setShowAdjacentRepeats] = useState<boolean>(false)
 
-  const ancestryGroups = [
+  const populations = [
     ...new Set(shortTandemRepeat.allele_size_distribution.map((cohort) => cohort.ancestry_group)),
   ].sort()
 
@@ -258,6 +261,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                     STRipy
                   </ExternalLink>
                 </ListItem>
+                {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
                 <ListItem>
                   {/* @ts-expect-error TS(2786) FIXME: 'ExternalLink' cannot be used as a JSX component. */}
                   <ExternalLink
@@ -291,7 +295,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ShortTandemRepeatAlleleSizeDistributionPlot
           maxRepeats={maxAlleleRepeats}
           alleleSizeDistribution={getSelectedAlleleSizeDistribution(shortTandemRepeat, {
-            selectedAncestryGroup,
+            selectedPopulation,
             selectedSex,
             selectedRepeatUnit: selectedAlleleSizeRepeatUnit,
           })}
@@ -315,10 +319,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ControlSection style={{ marginTop: '0.5em' }}>
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-repeat-counts`}
-            ancestryGroups={ancestryGroups}
-            selectedAncestryGroup={selectedAncestryGroup}
+            populations={populations}
+            selectedPopulation={selectedPopulation}
             selectedSex={selectedSex}
-            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedPopulation={setSelectedPopulation}
             setSelectedSex={setSelectedSex}
           />
 
@@ -454,7 +458,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           maxRepeats={maxGenotypeDistributionRepeats(shortTandemRepeat)}
           genotypeDistribution={getSelectedGenotypeDistribution(shortTandemRepeat, {
             selectedRepeatUnits: selectedGenotypeDistributionRepeatUnits,
-            selectedAncestryGroup,
+            selectedPopulation,
             selectedSex,
           })}
           xRanges={
@@ -486,10 +490,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ControlSection style={{ marginTop: '0.5em' }}>
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-genotype-distribution`}
-            ancestryGroups={ancestryGroups}
-            selectedAncestryGroup={selectedAncestryGroup}
+            populations={populations}
+            selectedPopulation={selectedPopulation}
             selectedSex={selectedSex}
-            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedPopulation={setSelectedPopulation}
             setSelectedSex={setSelectedSex}
           />
           <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
@@ -550,7 +554,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             shortTandemRepeatOrAdjacentRepeat={shortTandemRepeat}
             bin={selectedGenotypeDistributionBin}
             selectedRepeatUnits={selectedGenotypeDistributionRepeatUnits}
-            selectedAncestryGroup={selectedAncestryGroup}
+            selectedPopulation={selectedPopulation}
             selectedSex={selectedSex}
             repeatUnitPairs={genotypeDistributionRepunitPairs}
           />
@@ -584,12 +588,12 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                 <ShortTandemRepeatAdjacentRepeatSection
                   key={adjacentRepeat.id}
                   adjacentRepeat={adjacentRepeat}
-                  ancestryGroups={ancestryGroups}
-                  selectedAncestryGroup={selectedAncestryGroup}
+                  populations={populations}
+                  selectedPopulation={selectedPopulation}
                   selectedSex={selectedSex}
                   selectedScaleType={selectedScaleType}
                   selectedGenotypeDistributionBin={selectedGenotypeDistributionBin}
-                  setSelectedAncestryGroup={setSelectedAncestryGroup}
+                  setSelectedPopulation={setSelectedPopulation}
                   setSelectedSex={setSelectedSex}
                   setSelectedScaleType={setSelectedScaleType}
                   setSelectedGenotypeDistributionBin={setSelectedGenotypeDistributionBin}
@@ -623,10 +627,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         <ControlSection style={{ marginBottom: '1em' }}>
           <ShortTandemRepeatPopulationOptions
             id={`${shortTandemRepeat.id}-genotype-distribution`}
-            ancestryGroups={ancestryGroups}
-            selectedAncestryGroup={selectedAncestryGroup}
+            populations={populations}
+            selectedPopulation={selectedPopulation}
             selectedSex={selectedSex}
-            setSelectedAncestryGroup={setSelectedAncestryGroup}
+            setSelectedPopulation={setSelectedPopulation}
             setSelectedSex={setSelectedSex}
           />
         </ControlSection>
@@ -635,7 +639,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           shortTandemRepeat={shortTandemRepeat}
           maxRepeats={maxAlleleRepeats}
           alleleSizeDistributionRepeatUnits={alleleSizeDistributionRepunits}
-          filter={{ population: selectedAncestryGroup, sex: selectedSex }}
+          filter={{ population: selectedPopulation, sex: selectedSex }}
         />
       </section>
     </>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
index 210a7bccf..4410ac752 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
@@ -56,7 +56,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       q_score
       distribution {
         repunit_count
-        frequency
+        allele_count
       }
     }
     genotype_distribution {
@@ -69,7 +69,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       distribution {
         short_allele_repunit_count
         long_allele_repunit_count
-        frequency
+        genotype_count
       }
     }
     age_distribution {
@@ -96,7 +96,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       q_score
       distribution {
         repunit_count
-        frequency
+        allele_count
       }
     }
     genotype_distribution {
@@ -109,7 +109,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       distribution {
         short_allele_repunit_count
         long_allele_repunit_count
-        frequency
+        genotype_count
       }
     }
   }
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index 96101dcde..0b419fcd9 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -3,10 +3,7 @@ import styled from 'styled-components'
 
 import { Select } from '@gnomad/ui'
 
-import {
-  AncestryGroupId,
-  GNOMAD_ANCESTRY_GROUP_NAMES,
-} from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId, GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 import { Sex } from './ShortTandemRepeatPage'
 
@@ -28,41 +25,41 @@ const Label = styled.label`
 
 type Props = {
   id: string
-  ancestryGroups: AncestryGroupId[]
-  selectedAncestryGroup: AncestryGroupId | ''
+  populations: PopulationId[]
+  selectedPopulation: PopulationId | ''
   selectedSex: Sex | ''
-  setSelectedAncestryGroup: Dispatch<SetStateAction<AncestryGroupId | ''>>
+  setSelectedPopulation: Dispatch<SetStateAction<PopulationId | ''>>
   setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
 }
 
 const ShortTandemRepeatPopulationOptions = ({
   id,
-  ancestryGroups,
-  selectedAncestryGroup,
+  populations,
+  selectedPopulation,
   selectedSex,
-  setSelectedAncestryGroup,
+  setSelectedPopulation,
   setSelectedSex,
 }: Props) => {
-  const ancestryGroupsSortedByName = ancestryGroups.sort((group1, group2) =>
-    GNOMAD_ANCESTRY_GROUP_NAMES[group1].localeCompare(GNOMAD_ANCESTRY_GROUP_NAMES[group2])
+  const populationsSortedByName = populations.sort((group1, group2) =>
+    GNOMAD_POPULATION_NAMES[group1].localeCompare(GNOMAD_POPULATION_NAMES[group2])
   )
 
   return (
     <Wrapper>
       <Label htmlFor={`short-tandem-repeat-${id}-population-options-population`}>
-        Genetic ancestry group: &nbsp;
+        Population: &nbsp;
         {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
         <Select
           id={`short-tandem-repeat-${id}-population-options-population`}
-          value={selectedAncestryGroup}
-          onChange={(e: { target: { value: AncestryGroupId | '' } }) =>
-            setSelectedAncestryGroup(e.target.value)
+          value={selectedPopulation}
+          onChange={(e: { target: { value: PopulationId | '' } }) =>
+            setSelectedPopulation(e.target.value)
           }
         >
           <option value="">Global</option>
-          {ancestryGroupsSortedByName.map((ancestryGroup) => (
-            <option key={ancestryGroup} value={ancestryGroup}>
-              {GNOMAD_ANCESTRY_GROUP_NAMES[ancestryGroup]}
+          {populationsSortedByName.map((population) => (
+            <option key={population} value={population}>
+              {GNOMAD_POPULATION_NAMES[population]}
             </option>
           ))}
         </Select>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
index b36bbab57..2fbc3cf88 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
@@ -3,10 +3,7 @@ import styled from 'styled-components'
 
 import { Button, Input, Select } from '@gnomad/ui'
 
-import {
-  GNOMAD_POPULATION_NAMES,
-  AncestryGroupId,
-} from '@gnomad/dataset-metadata/gnomadPopulations'
+import { GNOMAD_POPULATION_NAMES, PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 import AttributeList, { AttributeListItem } from '../AttributeList'
 import Delayed from '../Delayed'
@@ -46,7 +43,7 @@ type ShortTandemRepeatReadProps = {
         lower: number
       }
     }[]
-    population: AncestryGroupId
+    population: PopulationId
     sex: string
     age?: string
     pcr_protocol: string
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 61ce2f7fb..3c3ee55c1 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -7,10 +7,10 @@ import {
   GenotypeDistributionItem,
   ShortTandemRepeatAdjacentRepeat,
 } from './ShortTandemRepeatPage'
-import { AncestryGroupId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 type AlleleSizeDistributionFilters = {
-  selectedAncestryGroup: AncestryGroupId | ''
+  selectedPopulation: PopulationId | ''
   selectedSex: Sex | ''
   selectedRepeatUnit: string
 }
@@ -22,10 +22,11 @@ const addCohortToAlleleSizeDistribution = (
   cohort.distribution.reduce((acc, distributionItem) => {
     const { repunit_count } = distributionItem
     const existingItem = acc[repunit_count]
-    const countSoFar = existingItem ? existingItem.frequency : 0
+    const countSoFar = existingItem ? existingItem.allele_count : 0
     const newItem: AlleleSizeDistributionItem = {
       repunit_count: repunit_count,
-      frequency: countSoFar + distributionItem.frequency,
+      allele_count: countSoFar + distributionItem.allele_count,
+      manual_genotype_quality: distributionItem.manual_genotype_quality,
     }
     return { ...acc, [repunit_count]: newItem }
   }, distribution)
@@ -42,7 +43,7 @@ const repunitsWithClassification = (
 
 export const getSelectedAlleleSizeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
-  { selectedAncestryGroup, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
+  { selectedPopulation, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
 ): AlleleSizeDistributionItem[] => {
   const matchingRepunits: Set<string> =
     selectedRepeatUnit.startsWith('classification') &&
@@ -50,9 +51,13 @@ export const getSelectedAlleleSizeDistribution = (
       ? repunitsWithClassification(shortTandemRepeatOrAdjacentRepeat, selectedRepeatUnit.slice(15))
       : new Set([selectedRepeatUnit])
 
+  console.log(
+    'shortTandemRepeatOrAdjacentRepeat.allele_size_distribution',
+    shortTandemRepeatOrAdjacentRepeat.allele_size_distribution
+  )
   const itemsByRepunitCount: Record<number, AlleleSizeDistributionItem> =
     shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.reduce((acc, cohort) => {
-      if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {
+      if (selectedPopulation !== '' && cohort.ancestry_group !== selectedPopulation) {
         return acc
       }
       if (selectedSex !== '' && cohort.sex !== selectedSex) {
@@ -64,6 +69,7 @@ export const getSelectedAlleleSizeDistribution = (
       }
       return addCohortToAlleleSizeDistribution(cohort, acc)
     }, {} as Record<number, AlleleSizeDistributionItem>)
+  console.log('itemsByRepunitCount', itemsByRepunitCount)
   return Object.values(itemsByRepunitCount)
 }
 
@@ -75,11 +81,11 @@ const addCohortToGenotypeDistribution = (
     const { short_allele_repunit_count, long_allele_repunit_count } = distributionItem
     const key = [short_allele_repunit_count, long_allele_repunit_count].join(' / ')
     const existingItem = acc[key]
-    const countSoFar = existingItem ? existingItem.frequency : 0
+    const countSoFar = existingItem ? existingItem.genotype_count : 0
     const newItem: GenotypeDistributionItem = {
       short_allele_repunit_count: short_allele_repunit_count,
       long_allele_repunit_count: long_allele_repunit_count,
-      frequency: countSoFar + distributionItem.frequency,
+      genotype_count: countSoFar + distributionItem.genotype_count,
     }
     return { ...acc, [key]: newItem }
   }, distribution)
@@ -88,17 +94,17 @@ export const getSelectedGenotypeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
   {
     selectedRepeatUnits,
-    selectedAncestryGroup,
+    selectedPopulation,
     selectedSex,
   }: {
     selectedRepeatUnits: string[] | ''
-    selectedAncestryGroup: AncestryGroupId | ''
+    selectedPopulation: PopulationId | ''
     selectedSex: Sex | ''
   }
 ): GenotypeDistributionItem[] => {
   const itemsByRepunitCounts: Record<string, GenotypeDistributionItem> =
     shortTandemRepeatOrAdjacentRepeat.genotype_distribution.reduce((acc, cohort) => {
-      if (selectedAncestryGroup !== '' && cohort.ancestry_group !== selectedAncestryGroup) {
+      if (selectedPopulation !== '' && cohort.ancestry_group !== selectedPopulation) {
         return acc
       }
       if (selectedSex !== '' && cohort.sex !== selectedSex) {

From 72005cfc5a119671d1df894c206cd432820f7fa4 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Wed, 30 Oct 2024 14:19:28 -0400
Subject: [PATCH 19/36] reverted variable names to match API

---
 ...ShortTandemRepeatAlleleSizeDistributionPlot.tsx |  4 ++--
 ...tTandemRepeatGenotypeDistributionBinDetails.tsx | 12 ++++--------
 .../ShortTandemRepeatGenotypeDistributionPlot.tsx  |  6 +++---
 .../ShortTandemRepeatPage.tsx                      | 12 ++++++++----
 .../ShortTandemRepeatPageContainer.tsx             |  8 ++++----
 .../shortTandemRepeatHelpers.ts                    | 14 ++++++++------
 6 files changed, 29 insertions(+), 27 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index d4899af45..1b24f620c 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -84,9 +84,9 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
         count: 0,
       }))
 
-      alleleSizeDistribution.forEach(({ repunit_count, allele_count }) => {
+      alleleSizeDistribution.forEach(({ repunit_count, frequency }) => {
         const binIndex = Math.floor(repunit_count / binSize)
-        d[binIndex].count += allele_count
+        d[binIndex].count += frequency
       })
 
       return d
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index 3890dec1f..5600b7aa2 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -50,11 +50,11 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
       <List>
         {genotypeDistribution
           .filter(isInBin)
-          .map(({ long_allele_repunit_count, short_allele_repunit_count, genotype_count }) => (
+          .map(({ long_allele_repunit_count, short_allele_repunit_count, frequency }) => (
             // @ts-expect-error TS(2769) FIXME: No overload matches this call.
             <ListItem key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}>
               {long_allele_repunit_count} repeats / {short_allele_repunit_count} repeats:{' '}
-              {genotype_count} individuals
+              {frequency} individuals
             </ListItem>
           ))}
       </List>
@@ -98,17 +98,13 @@ const ShortTandemRepeatGenotypeDistributionBinDetails = ({
                   {/* @ts-expect-error TS(2745) FIXME: This JSX tag's 'children' prop expects type 'never... Remove this comment to see the full error message */}
                   <List>
                     {distribution.map(
-                      ({
-                        short_allele_repunit_count,
-                        long_allele_repunit_count,
-                        genotype_count,
-                      }) => (
+                      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => (
                         // @ts-expect-error TS(2769) FIXME: No overload matches this call.
                         <ListItem
                           key={`${long_allele_repunit_count}/${short_allele_repunit_count}`}
                         >
                           {long_allele_repunit_count} repeats / {short_allele_repunit_count}{' '}
-                          repeats: {genotype_count} individuals
+                          repeats: {frequency} individuals
                         </ListItem>
                       )
                     )}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
index 69fd8d07d..cf4269fd6 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionPlot.tsx
@@ -104,10 +104,10 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     })
 
     genotypeDistribution.forEach(
-      ({ short_allele_repunit_count, long_allele_repunit_count, genotype_count }) => {
+      ({ short_allele_repunit_count, long_allele_repunit_count, frequency }) => {
         const xBinIndex = Math.floor(short_allele_repunit_count / xBinSize)
         const yBinIndex = Math.floor(long_allele_repunit_count / yBinSize)
-        data[xBinIndex * yNumBins + yBinIndex].count += genotype_count
+        data[xBinIndex * yNumBins + yBinIndex].count += frequency
       }
     )
 
@@ -145,7 +145,7 @@ const ShortTandemRepeatGenotypeDistributionPlot = withSize()(
     }
 
     const opacityScale = scaleLog()
-      .domain([1, max(genotypeDistribution, (d) => d.genotype_count) || 2])
+      .domain([1, max(genotypeDistribution, (d) => d.frequency) || 2])
       .range([0.1, 1])
 
     return (
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index aff7f8c49..f43531788 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -41,12 +41,15 @@ export type GenotypeQuality = 'low' | 'medium-low' | 'medium' | 'medium-high' |
 
 export type AlleleSizeDistributionItem = {
   repunit_count: number
-  allele_count: number
-  manual_genotype_quality: GenotypeQuality
+  frequency: number
+  quality_description: GenotypeQuality
+  q_score: number
 }
 
 export type Sex = 'XX' | 'XY'
 
+export type ColorBy = 'ManualGenoypeQuality' | 'QScore' | 'Population' | 'Sex'
+
 export type AlleleSizeDistributionCohort = {
   ancestry_group: PopulationId
   sex: Sex
@@ -59,7 +62,7 @@ export type AlleleSizeDistributionCohort = {
 export type GenotypeDistributionItem = {
   short_allele_repunit_count: number
   long_allele_repunit_count: number
-  genotype_count: number
+  frequency: number
 }
 
 export type GenotypeDistributionCohort = {
@@ -163,6 +166,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
 
   const [selectedPopulation, setSelectedPopulation] = useState<PopulationId | ''>('')
   const [selectedSex, setSelectedSex] = useState<Sex | ''>('')
+  const [selectedColorBy, setColorBy] = useState<ColorBy | ''>('')
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
@@ -577,7 +581,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
         )}
       </section>
 
-      {shortTandemRepeat.adjacent_repeats.length > 0 && (
+      {false && (
         <section style={{ marginBottom: '3em' }}>
           <h2>
             Adjacent Repeats <InfoButton topic="str-adjacent-repeats" />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
index 4410ac752..210a7bccf 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPageContainer.tsx
@@ -56,7 +56,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       q_score
       distribution {
         repunit_count
-        allele_count
+        frequency
       }
     }
     genotype_distribution {
@@ -69,7 +69,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       distribution {
         short_allele_repunit_count
         long_allele_repunit_count
-        genotype_count
+        frequency
       }
     }
     age_distribution {
@@ -96,7 +96,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       q_score
       distribution {
         repunit_count
-        allele_count
+        frequency
       }
     }
     genotype_distribution {
@@ -109,7 +109,7 @@ query ${operationName}($strId: String!, $datasetId: DatasetId!) {
       distribution {
         short_allele_repunit_count
         long_allele_repunit_count
-        genotype_count
+        frequency
       }
     }
   }
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 3c3ee55c1..5c67511ec 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -20,13 +20,15 @@ const addCohortToAlleleSizeDistribution = (
   distribution: Record<number, AlleleSizeDistributionItem>
 ): Record<number, AlleleSizeDistributionItem> =>
   cohort.distribution.reduce((acc, distributionItem) => {
-    const { repunit_count } = distributionItem
+    const { repunit_count, quality_description, q_score } = distributionItem
     const existingItem = acc[repunit_count]
-    const countSoFar = existingItem ? existingItem.allele_count : 0
+    const countSoFar = existingItem ? existingItem.frequency : 0
     const newItem: AlleleSizeDistributionItem = {
       repunit_count: repunit_count,
-      allele_count: countSoFar + distributionItem.allele_count,
-      manual_genotype_quality: distributionItem.manual_genotype_quality,
+      quality_description: quality_description,
+      q_score: q_score,
+
+      frequency: countSoFar + distributionItem.frequency,
     }
     return { ...acc, [repunit_count]: newItem }
   }, distribution)
@@ -81,11 +83,11 @@ const addCohortToGenotypeDistribution = (
     const { short_allele_repunit_count, long_allele_repunit_count } = distributionItem
     const key = [short_allele_repunit_count, long_allele_repunit_count].join(' / ')
     const existingItem = acc[key]
-    const countSoFar = existingItem ? existingItem.genotype_count : 0
+    const countSoFar = existingItem ? existingItem.frequency : 0
     const newItem: GenotypeDistributionItem = {
       short_allele_repunit_count: short_allele_repunit_count,
       long_allele_repunit_count: long_allele_repunit_count,
-      genotype_count: countSoFar + distributionItem.genotype_count,
+      frequency: countSoFar + distributionItem.frequency,
     }
     return { ...acc, [key]: newItem }
   }, distribution)

From 79a92bf4b21e6fb7e32a8801e9bb5f7a61a65a59 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 31 Oct 2024 15:18:27 -0400
Subject: [PATCH 20/36] finished initial implementation of adding colors to
 histogram

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx |   8 +-
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 119 ++++++++++++++++--
 .../ShortTandemRepeatColorBySelect.tsx        |  36 ++++++
 ...emRepeatGenotypeDistributionBinDetails.tsx |   3 +-
 .../ShortTandemRepeatPage.tsx                 |  39 ++++--
 .../shortTandemRepeatHelpers.ts               |  58 ++++++---
 6 files changed, 223 insertions(+), 40 deletions(-)
 create mode 100644 browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 373cb72a8..73d9fd4d9 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -5,7 +5,7 @@ import { Modal, Select } from '@gnomad/ui'
 import ControlSection from '../VariantPage/ControlSection'
 
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
-import { ShortTandemRepeatAdjacentRepeat, ScaleType, Sex } from './ShortTandemRepeatPage'
+import { ShortTandemRepeatAdjacentRepeat, ScaleType, Sex, ColorBy } from './ShortTandemRepeatPage'
 import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionPlot from './ShortTandemRepeatGenotypeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionBinDetails from './ShortTandemRepeatGenotypeDistributionBinDetails'
@@ -27,12 +27,14 @@ type Props = {
   selectedScaleType: ScaleType
   selectedPopulation: PopulationId | ''
   selectedSex: Sex | ''
+  selectedColorBy: ColorBy | ''
   populations: PopulationId[]
   selectedGenotypeDistributionBin: GenotypeBin | null
   setSelectedGenotypeDistributionBin: Dispatch<SetStateAction<GenotypeBin | null>>
   setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
   setSelectedPopulation: Dispatch<SetStateAction<PopulationId | ''>>
   setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
+  setSelectedColorBy: Dispatch<SetStateAction<ColorBy | ''>>
 }
 
 const ShortTandemRepeatAdjacentRepeatSection = ({
@@ -41,9 +43,11 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
   selectedScaleType,
   selectedPopulation,
   selectedSex,
+  selectedColorBy,
   setSelectedScaleType,
   setSelectedPopulation,
   setSelectedSex,
+  setSelectedColorBy,
 }: Props) => {
   const [selectedRepeatUnit, setSelectedRepeatUnit] = useState(
     adjacentRepeat.repeat_units.length === 1 ? adjacentRepeat.repeat_units[0] : ''
@@ -69,8 +73,10 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
         alleleSizeDistribution={getSelectedAlleleSizeDistribution(adjacentRepeat, {
           selectedPopulation,
           selectedSex,
+          selectedColorBy,
           selectedRepeatUnit,
         })}
+        colorBy={selectedColorBy}
         repeatUnitLength={selectedRepeatUnit ? selectedRepeatUnit.length : null}
         scaleType={selectedScaleType}
       />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 1b24f620c..fe595337b 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -6,7 +6,15 @@ import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
 
 import { TooltipAnchor } from '@gnomad/ui'
-import { AlleleSizeDistributionItem, ScaleType } from './ShortTandemRepeatPage'
+import {
+  AlleleSizeDistributionItem,
+  ColorBy,
+  GenotypeQuality,
+  QScoreBin,
+  ScaleType,
+  Sex,
+} from './ShortTandemRepeatPage'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -24,6 +32,49 @@ const TooltipTrigger = styled.rect`
   }
 `
 
+const colorMap: Record<string, Record<string, string>> = {
+  '': {
+    '': '#73ab3d',
+  },
+  quality_description: {
+    low: '#d73027',
+    'low-medium': '#fc8d59',
+    medium: '#fee08b',
+    'medium-high': '#d9ef8b',
+    high: '#1a9850',
+    'not-reviewed': '#aaaaaa',
+  },
+  q_score: {
+    '0.0': '#ff0000',
+    '0.1': '#ff3300',
+    '0.2': '#ff6600',
+    '0.3': '#ff9900',
+    '0.4': '#ffcc00',
+    '0.5': '#ffff00',
+    '0.6': '#ccff33',
+    '0.7': '#99ff66',
+    '0.8': '#66ff99',
+    '0.9': '#33ffcc',
+    '1.0': '#00ff00',
+  },
+  sex: {
+    XX: '#73ab3d',
+    XY: '#ff7f0e',
+  },
+  population: {
+    nfe: '#377eb8',
+    afr: '#4daf4a',
+    fin: '#e41a1c',
+    amr: '#984ea3',
+    ami: '#ff7f00',
+    asj: '#ffff33',
+    eas: '#a65628',
+    mid: '#f781bf',
+    oth: '#999999',
+    sas: '#a6cee3',
+  },
+}
+
 const tickFormat = (n: number) => {
   if (n >= 1e9) {
     return `${(n / 1e9).toPrecision(3)}B`
@@ -47,6 +98,7 @@ type Range = { start: number; stop: number; label: string }
 type Props = {
   maxRepeats: number
   alleleSizeDistribution: AlleleSizeDistributionItem[]
+  colorBy: ColorBy | ''
   repeatUnitLength: number | null
   scaleType: ScaleType
   ranges?: Range[]
@@ -57,6 +109,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
   ({
     maxRepeats,
     alleleSizeDistribution,
+    colorBy,
     repeatUnitLength,
     size: { width },
     scaleType = 'linear',
@@ -91,6 +144,55 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
 
       return d
     }, [alleleSizeDistribution, nBins, binSize])
+
+    // maps binIndex and colorByValue to a y and y start
+    const dataWithColor = useMemo(() => {
+      //sort by ColorBy value
+      alleleSizeDistribution.sort((a, b) => {
+        if (a.colorByValue < b.colorByValue) {
+          return 1
+        }
+        if (a.colorByValue > b.colorByValue) {
+          return -1
+        }
+        return 0
+      })
+
+      const d: Record<
+        string,
+        { binIndex: number; label: string; count: number; startCount: number; color: string }
+      > = {}
+
+      alleleSizeDistribution.forEach(({ repunit_count, colorByValue, frequency }) => {
+        const n = Math.floor(repunit_count / binSize)
+        const key = `${n}/${colorByValue}`
+        const labelPrefix = colorByValue ? `${colorByValue}: ` : ''
+        if (!d[key]) {
+          d[key] = {
+            binIndex: n,
+            label:
+              binSize === 1
+                ? `${labelPrefix} ${n}`
+                : `${labelPrefix} ${n * binSize} - ${n * binSize + binSize - 1}`,
+            count: 0,
+            startCount: 0,
+            color: colorMap[colorBy] ? colorMap[colorBy][colorByValue] : '#73ab3d',
+          }
+        }
+
+        d[key].count += frequency
+      })
+
+      return Object.values(d)
+    }, [alleleSizeDistribution, nBins, binSize])
+
+    const binCountCache = Array(nBins).fill(0)
+    dataWithColor.forEach((d) => {
+      d.startCount = binCountCache[d.binIndex]
+      console.log('data point:', d)
+      binCountCache[d.binIndex] += d.count
+    })
+
     const xScale = scaleBand<number>()
       .domain(data.map((d) => d.binIndex))
       .range([0, plotWidth])
@@ -198,16 +300,17 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
             />
           )}
           <g transform={`translate(${margin.left},${margin.top})`}>
-            {data.map((d) => {
-              const y = d.count === 0 ? plotHeight : yScale(d.count)
+            {dataWithColor.map((d) => {
+              const y = d.count === 0 ? 0 : yScale(d.count)
+              const yStart = d.startCount === 0 ? 0 : plotHeight - yScale(d.startCount)
               return (
-                <React.Fragment key={`${d.binIndex}`}>
+                <React.Fragment key={`${d.binIndex}-${d.color}`}>
                   <rect
                     x={xScale(d.binIndex)}
-                    y={y}
+                    y={y - yStart}
                     height={plotHeight - y}
                     width={xBandwidth}
-                    fill="#73ab3d"
+                    fill={d.color}
                     stroke="#333"
                   />
                   <TooltipAnchor
@@ -218,8 +321,8 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
                   >
                     <TooltipTrigger
                       x={xScale(d.binIndex)}
-                      y={0}
-                      height={plotHeight}
+                      y={y - yStart}
+                      height={plotHeight - y}
                       width={xBandwidth}
                       fill="none"
                       style={{ pointerEvents: 'visible' }}
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
new file mode 100644
index 000000000..34af165d3
--- /dev/null
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -0,0 +1,36 @@
+import React, { Dispatch, SetStateAction } from 'react'
+import styled from 'styled-components'
+
+import { Select } from '@gnomad/ui'
+import { ColorBy } from './ShortTandemRepeatPage'
+
+const Label = styled.label`
+  padding-right: 1em;
+`
+
+type Props = {
+  id: string
+  selectedColorBy: ColorBy | ''
+  setSelectedColorBy: Dispatch<SetStateAction<ColorBy | ''>>
+}
+
+const ShortTandemRepeatColorBySelect = ({ id, selectedColorBy, setSelectedColorBy }: Props) => {
+  return (
+    <Label htmlFor={`short-tandem-repeat-${id}-color-by-select`}>
+      Color By: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
+      <Select
+        id={`short-tandem-repeat-${id}-color-by-select`}
+        value={selectedColorBy}
+        onChange={(e: { target: { value: ColorBy | '' } }) => setSelectedColorBy(e.target.value)}
+      >
+        <option value="">None</option>
+        <option value="quality_description">GQ: manual review</option>
+        <option value="q_score">GQ: Q score</option>
+        <option value="sex">Sex</option>
+        <option value="population">Population</option>
+      </Select>
+    </Label>
+  )
+}
+
+export default ShortTandemRepeatColorBySelect
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index 5600b7aa2..53d74d32d 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -9,11 +9,10 @@ import {
   GenotypeDistributionItem,
 } from './ShortTandemRepeatPage'
 import { getSelectedGenotypeDistribution } from './shortTandemRepeatHelpers'
-import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 type Props = {
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
-  selectedPopulation: PopulationId | ''
+  selectedPopulation: string | ''
   selectedSex: Sex | ''
   selectedRepeatUnits: string[] | ''
   repeatUnitPairs: string[][]
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index f43531788..f0dd15763 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -13,6 +13,7 @@ import ShortTandemRepeatAgeDistributionPlot from './ShortTandemRepeatAgeDistribu
 import ShortTandemRepeatAssociatedDiseasesTable from './ShortTandemRepeatAssociatedDiseasesTable'
 import ShortTandemRepeatAttributes from './ShortTandemRepeatAttributes'
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
+import ShortTandemRepeatColorBySelect from './ShortTandemRepeatColorBySelect'
 import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionPlot, {
   Bin as GenotypeBin,
@@ -38,24 +39,35 @@ type ShortTandemRepeatReferenceRegion = {
 }
 
 export type GenotypeQuality = 'low' | 'medium-low' | 'medium' | 'medium-high' | 'high'
-
+export type QScoreBin =
+  | '0.0'
+  | '0.1'
+  | '0.2'
+  | '0.3'
+  | '0.4'
+  | '0.5'
+  | '0.6'
+  | '0.7'
+  | '0.8'
+  | '0.9'
+  | '1.0'
+export type ColorByValue = GenotypeQuality | QScoreBin | Sex | PopulationId | ''
 export type AlleleSizeDistributionItem = {
   repunit_count: number
   frequency: number
-  quality_description: GenotypeQuality
-  q_score: number
+  colorByValue: ColorByValue
 }
 
 export type Sex = 'XX' | 'XY'
 
-export type ColorBy = 'ManualGenoypeQuality' | 'QScore' | 'Population' | 'Sex'
+export type ColorBy = 'quality_description' | 'q_score' | 'population' | 'sex'
 
 export type AlleleSizeDistributionCohort = {
   ancestry_group: PopulationId
   sex: Sex
   repunit: string
-  quality_description: string
-  q_score: number
+  quality_description: GenotypeQuality
+  q_score: QScoreBin
   distribution: AlleleSizeDistributionItem[]
 }
 
@@ -70,8 +82,8 @@ export type GenotypeDistributionCohort = {
   sex: Sex
   short_allele_repunit: string
   long_allele_repunit: string
-  quality_description: string
-  q_score: number
+  quality_description: GenotypeQuality
+  q_score: QScoreBin
   distribution: GenotypeDistributionItem[]
 }
 
@@ -166,7 +178,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
 
   const [selectedPopulation, setSelectedPopulation] = useState<PopulationId | ''>('')
   const [selectedSex, setSelectedSex] = useState<Sex | ''>('')
-  const [selectedColorBy, setColorBy] = useState<ColorBy | ''>('')
+  const [selectedColorBy, setSelectedColorBy] = useState<ColorBy | ''>('')
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
@@ -301,8 +313,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           alleleSizeDistribution={getSelectedAlleleSizeDistribution(shortTandemRepeat, {
             selectedPopulation,
             selectedSex,
+            selectedColorBy,
             selectedRepeatUnit: selectedAlleleSizeRepeatUnit,
           })}
+          colorBy={selectedColorBy}
           repeatUnitLength={
             selectedAlleleSizeRepeatUnit &&
             !selectedAlleleSizeRepeatUnit.startsWith('classification')
@@ -329,6 +343,11 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             setSelectedPopulation={setSelectedPopulation}
             setSelectedSex={setSelectedSex}
           />
+          <ShortTandemRepeatColorBySelect
+            id={`${shortTandemRepeat.id}-color-by`}
+            selectedColorBy={selectedColorBy}
+            setSelectedColorBy={setSelectedColorBy}
+          />
 
           {alleleSizeDistributionRepunits.length > 1 && (
             <label htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-repeat-unit`}>
@@ -595,10 +614,12 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
                   populations={populations}
                   selectedPopulation={selectedPopulation}
                   selectedSex={selectedSex}
+                  selectedColorBy={selectedColorBy}
                   selectedScaleType={selectedScaleType}
                   selectedGenotypeDistributionBin={selectedGenotypeDistributionBin}
                   setSelectedPopulation={setSelectedPopulation}
                   setSelectedSex={setSelectedSex}
+                  setSelectedColorBy={setSelectedColorBy}
                   setSelectedScaleType={setSelectedScaleType}
                   setSelectedGenotypeDistributionBin={setSelectedGenotypeDistributionBin}
                 />
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index 5c67511ec..de1da8ba4 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -1,4 +1,6 @@
 import {
+  ColorBy,
+  GenotypeQuality,
   Sex,
   ShortTandemRepeat,
   AlleleSizeDistributionItem,
@@ -6,32 +8,45 @@ import {
   GenotypeDistributionCohort,
   GenotypeDistributionItem,
   ShortTandemRepeatAdjacentRepeat,
+  ColorByValue,
 } from './ShortTandemRepeatPage'
-import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
-type AlleleSizeDistributionFilters = {
-  selectedPopulation: PopulationId | ''
+type AlleleSizeDistributionParams = {
+  selectedPopulation: string | ''
   selectedSex: Sex | ''
+  selectedColorBy: ColorBy | ''
   selectedRepeatUnit: string
 }
 
 const addCohortToAlleleSizeDistribution = (
   cohort: AlleleSizeDistributionCohort,
-  distribution: Record<number, AlleleSizeDistributionItem>
-): Record<number, AlleleSizeDistributionItem> =>
-  cohort.distribution.reduce((acc, distributionItem) => {
-    const { repunit_count, quality_description, q_score } = distributionItem
-    const existingItem = acc[repunit_count]
+  colorBy: ColorBy | '',
+  distribution: Record<string, AlleleSizeDistributionItem>
+): Record<string, AlleleSizeDistributionItem> => {
+  let colorByValue: ColorByValue = ''
+  if (colorBy === 'quality_description') {
+    colorByValue = cohort.quality_description
+  } else if (colorBy === 'q_score') {
+    colorByValue = cohort.q_score
+  } else if (colorBy === 'sex') {
+    colorByValue = cohort.sex
+  } else if (colorBy === 'population') {
+    colorByValue = cohort.ancestry_group
+  }
+
+  return cohort.distribution.reduce((acc, distributionItem) => {
+    const { repunit_count } = distributionItem
+    const key = `${repunit_count}/${colorByValue}`
+    const existingItem = acc[key]
     const countSoFar = existingItem ? existingItem.frequency : 0
     const newItem: AlleleSizeDistributionItem = {
       repunit_count: repunit_count,
-      quality_description: quality_description,
-      q_score: q_score,
-
+      colorByValue: colorByValue,
       frequency: countSoFar + distributionItem.frequency,
     }
-    return { ...acc, [repunit_count]: newItem }
+    return { ...acc, [key]: newItem }
   }, distribution)
+}
 
 const repunitsWithClassification = (
   shortTandemRepeat: ShortTandemRepeat,
@@ -45,7 +60,12 @@ const repunitsWithClassification = (
 
 export const getSelectedAlleleSizeDistribution = (
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat,
-  { selectedPopulation, selectedSex, selectedRepeatUnit }: AlleleSizeDistributionFilters
+  {
+    selectedPopulation,
+    selectedSex,
+    selectedColorBy,
+    selectedRepeatUnit,
+  }: AlleleSizeDistributionParams
 ): AlleleSizeDistributionItem[] => {
   const matchingRepunits: Set<string> =
     selectedRepeatUnit.startsWith('classification') &&
@@ -53,10 +73,6 @@ export const getSelectedAlleleSizeDistribution = (
       ? repunitsWithClassification(shortTandemRepeatOrAdjacentRepeat, selectedRepeatUnit.slice(15))
       : new Set([selectedRepeatUnit])
 
-  console.log(
-    'shortTandemRepeatOrAdjacentRepeat.allele_size_distribution',
-    shortTandemRepeatOrAdjacentRepeat.allele_size_distribution
-  )
   const itemsByRepunitCount: Record<number, AlleleSizeDistributionItem> =
     shortTandemRepeatOrAdjacentRepeat.allele_size_distribution.reduce((acc, cohort) => {
       if (selectedPopulation !== '' && cohort.ancestry_group !== selectedPopulation) {
@@ -69,9 +85,11 @@ export const getSelectedAlleleSizeDistribution = (
       if (selectedRepeatUnit !== '' && !matchingRepunits.has(cohort.repunit)) {
         return acc
       }
-      return addCohortToAlleleSizeDistribution(cohort, acc)
+      return addCohortToAlleleSizeDistribution(cohort, selectedColorBy, acc)
     }, {} as Record<number, AlleleSizeDistributionItem>)
-  console.log('itemsByRepunitCount', itemsByRepunitCount)
+
+  //console.log('itemsByRepunitCount', itemsByRepunitCount)
+
   return Object.values(itemsByRepunitCount)
 }
 
@@ -100,7 +118,7 @@ export const getSelectedGenotypeDistribution = (
     selectedSex,
   }: {
     selectedRepeatUnits: string[] | ''
-    selectedPopulation: PopulationId | ''
+    selectedPopulation: string | ''
     selectedSex: Sex | ''
   }
 ): GenotypeDistributionItem[] => {

From 5a60d32a5377e17a277c56c12312687b16a36a4a Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 31 Oct 2024 15:21:58 -0400
Subject: [PATCH 21/36] renamed ancestryGroupId to populationId to match the
 main branch

---
 graphql-api/src/graphql/resolvers/va.ts | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/graphql-api/src/graphql/resolvers/va.ts b/graphql-api/src/graphql/resolvers/va.ts
index 790c3d33e..11b490cdf 100644
--- a/graphql-api/src/graphql/resolvers/va.ts
+++ b/graphql-api/src/graphql/resolvers/va.ts
@@ -209,14 +209,14 @@ const cohortDescription = (
     return `${capitalize(frequencyField)} Cohort`
   }
 
-  const [ancestryGroupId, sexId] = getAncestryAndSexIds(subsetId)
+  const [populationId, sexId] = getAncestryAndSexIds(subsetId)
 
-  if (ancestryGroupId) {
-    const ancestryGroupName = POPULATION_NAMES[ancestryGroupId]
+  if (populationId) {
+    const populationName = POPULATION_NAMES[populationId]
     if (sexId) {
-      return `${capitalize(frequencyField)} ${ancestryGroupName} ${sexId} Ancestry Group`
+      return `${capitalize(frequencyField)} ${populationName} ${sexId} Population`
     }
-    return `${capitalize(frequencyField)} ${ancestryGroupName} Ancestry Group`
+    return `${capitalize(frequencyField)} ${populationName} Population`
   }
   return sexId!
 }
@@ -226,17 +226,17 @@ const cohortForSubset = (subset: Subset, frequencyField: 'exome' | 'genome'): Co
     return { id: 'ALL', label: capitalize(frequencyField), characteristics: null }
   }
 
-  const [ancestryGroupId, sexId] = getAncestryAndSexIds(subset.id)
+  const [populationId, sexId] = getAncestryAndSexIds(subset.id)
 
   const sexCharacteristics: CohortCharacteristic[] = sexId
     ? [{ name: 'biological sex', value: sexId }]
     : []
   const ancestryCharacteristics: CohortCharacteristic[] =
-    ancestryGroupId && POPULATION_NAMES[ancestryGroupId]
+    populationId && POPULATION_NAMES[populationId]
       ? [
           {
             name: 'genetic ancestry',
-            value: POPULATION_NAMES[ancestryGroupId],
+            value: POPULATION_NAMES[populationId],
           },
         ]
       : []

From 92573a3e4fbe8d0b5ff04fa95f39e187a9bbdc53 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 31 Oct 2024 15:22:41 -0400
Subject: [PATCH 22/36] updated shortTandemRepeatFactory

---
 browser/src/__factories__/ShortTandemRepeat.ts | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/browser/src/__factories__/ShortTandemRepeat.ts b/browser/src/__factories__/ShortTandemRepeat.ts
index 81f0d59a9..716782eeb 100644
--- a/browser/src/__factories__/ShortTandemRepeat.ts
+++ b/browser/src/__factories__/ShortTandemRepeat.ts
@@ -35,10 +35,10 @@ const shortTandemRepeatFactory = Factory.define<ShortTandemRepeat>(({ params, as
         sex: 'XY',
         repunit: 'ACCA',
         quality_description: 'medium-low',
-        q_score: 0.6,
+        q_score: '0.6',
         distribution: [
-          { repunit_count: 3, frequency: 12 },
-          { repunit_count: 4, frequency: 123 },
+          { repunit_count: 3, frequency: 12, colorByValue: 'low' },
+          { repunit_count: 4, frequency: 123, colorByValue: 'high' },
         ],
       },
     ],
@@ -49,7 +49,7 @@ const shortTandemRepeatFactory = Factory.define<ShortTandemRepeat>(({ params, as
         short_allele_repunit: 'ACCA',
         long_allele_repunit: 'GATA',
         quality_description: 'high',
-        q_score: 1.0,
+        q_score: '1.0',
         distribution: [
           { short_allele_repunit_count: 8, long_allele_repunit_count: 9, frequency: 15 },
           { short_allele_repunit_count: 8, long_allele_repunit_count: 10, frequency: 19 },

From 83d0e32fe02355166a6a7343a30bf728d22ee5dc Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 4 Nov 2024 14:46:31 -0500
Subject: [PATCH 23/36] fixup: update snapshots

---
 .../ShortTandemRepeatPage.spec.tsx.snap       | 11160 ++++++++++++----
 ...ortTandemRepeatPageContainer.spec.tsx.snap |  1976 ++-
 2 files changed, 9190 insertions(+), 3946 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPage.spec.tsx.snap b/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPage.spec.tsx.snap
index 73a9953c4..1a9bb5445 100644
--- a/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPage.spec.tsx.snap
+++ b/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPage.spec.tsx.snap
@@ -14,16 +14,49 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -55,17 +88,46 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -86,17 +148,24 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -119,16 +188,49 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -160,17 +262,46 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -195,33 +326,22 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -233,28 +353,21 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -277,6 +390,20 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -294,56 +421,38 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -354,25 +463,70 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -404,23 +558,51 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -452,7 +634,31 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -490,33 +696,78 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="exac"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -548,17 +799,46 @@ exports[`ShortTandemRepeatPage with "exac" dataset has no unexected changes 1`]
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -583,16 +863,49 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -624,17 +937,46 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
-            "id": "STR1",
-            "reference_region": {
-              "chrom": "1",
-              "start": 10000000,
-              "stop": 15000000,
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
+            "id": "STR1",
+            "main_reference_region": {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -655,17 +997,24 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -688,16 +1037,49 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -729,17 +1111,46 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -764,33 +1175,22 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -802,28 +1202,21 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -846,6 +1239,20 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -863,56 +1270,38 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -923,25 +1312,70 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -973,23 +1407,51 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -1021,7 +1483,31 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -1059,33 +1545,78 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_cnv_r4"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -1117,17 +1648,46 @@ exports[`ShortTandemRepeatPage with "gnomad_cnv_r4" dataset has no unexected cha
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -1152,16 +1712,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -1193,17 +1786,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -1224,17 +1846,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
-        </List>
-      </React.Fragment>
-      <h2>
-        Related Loci
-      </h2>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
+        </List>
+      </React.Fragment>
+      <h2>
+        TRs in gnomAD
+      </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -1257,16 +1886,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -1298,17 +1960,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -1333,33 +2024,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -1371,28 +2051,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -1415,6 +2088,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -1432,56 +2119,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
-        ]
-      }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -1492,25 +2161,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -1542,23 +2256,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -1590,7 +2332,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -1628,33 +2394,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r2_1"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -1686,17 +2497,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1" dataset has no unexected chang
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -1721,16 +2561,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -1762,17 +2635,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -1793,17 +2695,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -1826,21 +2735,54 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
-            "associated_diseases": [
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
               {
-                "inheritance_mode": "Autosomal dominant",
-                "name": "disease",
-                "notes": "hello world",
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
+            "associated_diseases": [
+              {
+                "inheritance_mode": "Autosomal dominant",
+                "name": "disease",
+                "notes": "hello world",
                 "omim_id": "123456",
                 "repeat_size_classifications": [
                   {
@@ -1867,17 +2809,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -1901,34 +2872,23 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
     </h2>
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
-        [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -1940,28 +2900,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -1984,6 +2937,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -2001,56 +2968,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -2061,25 +3010,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -2111,23 +3105,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -2159,7 +3181,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -2197,33 +3243,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r2_1_controls"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -2255,17 +3346,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_controls" dataset has no unexec
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -2290,16 +3410,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -2331,17 +3484,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -2362,17 +3544,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -2395,16 +3584,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -2436,20 +3658,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
-            "id": "STR1",
-            "reference_region": {
-              "chrom": "1",
-              "start": 10000000,
-              "stop": 15000000,
-            },
-            "reference_repeat_unit": "CTG",
-            "repeat_units": [],
-            "stripy_id": "STR1",
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
+            "id": "STR1",
+            "main_reference_region": {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
+            "reference_repeat_unit": "CTG",
+            "repeat_units": [],
+            "stripy_id": "STR1",
           }
         }
       />
@@ -2471,33 +3722,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -2509,28 +3749,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -2553,6 +3786,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -2570,56 +3817,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -2630,25 +3859,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -2680,23 +3954,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -2728,7 +4030,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -2766,33 +4092,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r2_1_non_cancer"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -2824,17 +4195,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_cancer" dataset has no unex
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -2859,16 +4259,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -2900,17 +4333,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -2931,17 +4393,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -2964,16 +4433,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -3005,17 +4507,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -3040,33 +4571,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -3078,28 +4598,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -3122,6 +4635,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -3139,56 +4666,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -3199,25 +4708,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -3249,23 +4803,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -3297,7 +4879,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -3335,33 +4941,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r2_1_non_neuro"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -3393,17 +5044,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_neuro" dataset has no unexe
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -3428,16 +5108,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -3469,17 +5182,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -3500,17 +5242,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -3533,16 +5282,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -3574,17 +5356,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -3609,33 +5420,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -3647,30 +5447,23 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
       <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
-      <label
-        htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
+        htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
         Scale: 
         <Select
@@ -3691,6 +5484,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -3708,56 +5515,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -3768,25 +5557,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -3818,23 +5652,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -3866,7 +5728,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -3904,33 +5790,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r2_1_non_topmed"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -3962,17 +5893,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r2_1_non_topmed" dataset has no unex
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -3997,16 +5957,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4038,17 +6031,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -4069,17 +6091,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -4102,16 +6131,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4143,17 +6205,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -4178,33 +6269,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -4216,28 +6296,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -4260,14 +6333,28 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
         </Select>
       </label>
     </ControlSection>
-  </section>
-  <section
-    style={
-      {
-        "marginBottom": "3em",
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
       }
-    }
-  >
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
+  </section>
+  <section
+    style={
+      {
+        "marginBottom": "3em",
+      }
+    }
+  >
     <h2>
       Genotype Distribution 
       <InfoButton
@@ -4277,56 +6364,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -4337,25 +6406,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4387,23 +6501,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -4435,7 +6577,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -4473,33 +6639,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -4531,17 +6742,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3" dataset has no unexected changes
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -4566,16 +6806,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4607,17 +6880,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -4638,17 +6940,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -4671,16 +6980,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4712,17 +7054,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -4747,33 +7118,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -4785,28 +7145,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -4829,6 +7182,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -4846,56 +7213,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -4906,25 +7255,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -4956,23 +7350,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -5004,7 +7426,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -5042,33 +7488,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3_controls_and_biobanks"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -5100,17 +7591,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_controls_and_biobanks" dataset ha
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -5135,16 +7655,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -5176,17 +7729,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -5207,17 +7789,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -5240,16 +7829,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -5281,17 +7903,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -5316,33 +7967,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -5354,28 +7994,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -5398,6 +8031,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -5415,56 +8062,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -5475,25 +8104,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -5525,23 +8199,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -5573,7 +8275,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -5611,33 +8337,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3_non_cancer"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -5669,17 +8440,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_cancer" dataset has no unexec
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -5704,16 +8504,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -5745,17 +8578,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -5776,17 +8638,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -5809,16 +8678,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -5850,17 +8752,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -5885,33 +8816,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -5923,28 +8843,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -5967,6 +8880,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -5984,56 +8911,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
-        ]
-      }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -6044,31 +8953,76 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
-            "associated_diseases": [
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
               {
-                "inheritance_mode": "Autosomal dominant",
-                "name": "disease",
-                "notes": "hello world",
-                "omim_id": "123456",
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
+            "associated_diseases": [
+              {
+                "inheritance_mode": "Autosomal dominant",
+                "name": "disease",
+                "notes": "hello world",
+                "omim_id": "123456",
                 "repeat_size_classifications": [
                   {
                     "classification": "Normal",
@@ -6094,23 +9048,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -6142,7 +9124,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -6180,33 +9186,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3_non_neuro"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -6238,17 +9289,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_neuro" dataset has no unexect
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -6273,16 +9353,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -6314,17 +9427,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -6345,17 +9487,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -6378,16 +9527,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -6419,17 +9601,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -6454,33 +9665,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -6492,28 +9692,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -6536,6 +9729,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -6553,56 +9760,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -6613,25 +9802,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -6663,23 +9897,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
-            "id": "STR1",
-            "reference_region": {
-              "chrom": "1",
-              "start": 10000000,
-              "stop": 15000000,
-            },
-            "reference_repeat_unit": "CTG",
-            "repeat_units": [],
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
+            "id": "STR1",
+            "main_reference_region": {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
+            "reference_repeat_unit": "CTG",
+            "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -6711,7 +9973,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -6749,33 +10035,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3_non_topmed"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -6807,17 +10138,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_topmed" dataset has no unexec
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -6842,16 +10202,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -6883,17 +10276,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -6914,17 +10336,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -6947,16 +10376,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -6988,17 +10450,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -7023,33 +10514,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -7061,28 +10541,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -7105,6 +10578,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -7122,56 +10609,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -7182,25 +10651,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -7232,23 +10746,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -7280,8 +10822,32 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
-      ranges={
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
+      ranges={
         [
           {
             "label": "Normal",
@@ -7318,33 +10884,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r3_non_v2"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -7376,17 +10987,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r3_non_v2" dataset has no unexected
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -7411,16 +11051,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -7452,17 +11125,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -7483,17 +11185,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -7516,16 +11225,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -7557,17 +11299,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -7591,34 +11362,23 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
     </h2>
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
-        [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -7630,28 +11390,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -7674,6 +11427,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -7691,56 +11458,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -7751,25 +11500,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -7801,23 +11595,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -7849,7 +11671,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -7887,33 +11733,78 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r4"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -7945,17 +11836,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4" dataset has no unexected changes
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -7980,16 +11900,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8021,17 +11974,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -8052,17 +12034,24 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -8085,16 +12074,49 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8126,17 +12148,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -8161,33 +12212,22 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -8199,28 +12239,21 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -8243,6 +12276,20 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -8260,56 +12307,38 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -8320,25 +12349,70 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8370,23 +12444,51 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -8418,7 +12520,31 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -8456,39 +12582,84 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_r4_non_ukb"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
-          "associated_diseases": [
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
             {
-              "inheritance_mode": "Autosomal dominant",
-              "name": "disease",
-              "notes": "hello world",
-              "omim_id": "123456",
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
+          "associated_diseases": [
+            {
+              "inheritance_mode": "Autosomal dominant",
+              "name": "disease",
+              "notes": "hello world",
+              "omim_id": "123456",
               "repeat_size_classifications": [
                 {
                   "classification": "Normal",
@@ -8514,17 +12685,46 @@ exports[`ShortTandemRepeatPage with "gnomad_r4_non_ukb" dataset has no unexected
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -8549,16 +12749,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8590,17 +12823,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -8621,17 +12883,24 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -8654,16 +12923,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8695,17 +12997,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -8729,34 +13060,23 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
     </h2>
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
-        [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -8768,28 +13088,21 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -8812,6 +13125,20 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -8829,56 +13156,38 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -8889,25 +13198,70 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -8939,23 +13293,51 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -8987,7 +13369,31 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -9025,33 +13431,78 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_sv_r2_1"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -9083,17 +13534,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1" dataset has no unexected ch
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
-          "id": "STR1",
-          "reference_region": {
-            "chrom": "1",
-            "start": 10000000,
-            "stop": 15000000,
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
+          "id": "STR1",
+          "main_reference_region": {
+            "chrom": "1",
+            "start": 10000000,
+            "stop": 15000000,
+          },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -9118,16 +13598,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -9159,17 +13672,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -9190,17 +13732,24 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -9223,16 +13772,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -9264,17 +13846,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -9298,34 +13909,23 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
     </h2>
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
-        [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -9337,28 +13937,21 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -9381,6 +13974,20 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -9398,56 +14005,38 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
-        ]
-      }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -9458,25 +14047,70 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -9508,23 +14142,51 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -9556,7 +14218,31 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -9594,33 +14280,78 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_sv_r2_1_controls"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -9652,17 +14383,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_controls" dataset has no une
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -9687,16 +14447,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -9728,17 +14521,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -9759,17 +14581,24 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -9792,16 +14621,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -9833,17 +14695,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -9867,34 +14758,23 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
     </h2>
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
-        [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -9906,28 +14786,21 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -9950,6 +14823,20 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -9967,56 +14854,38 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
-        ]
-      }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -10027,25 +14896,70 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -10077,23 +14991,51 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -10125,7 +15067,31 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -10163,33 +15129,78 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_sv_r2_1_non_neuro"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -10221,17 +15232,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r2_1_non_neuro" dataset has no un
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
@@ -10256,16 +15296,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -10297,17 +15370,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -10328,17 +15430,24 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
               STRipy
             </Link__ExternalLink>
           </List__ListItem>
+          <List__ListItem>
+            <Link__ExternalLink
+              href="https://strchive.org/database/STR1.html"
+            >
+              STRchive
+            </Link__ExternalLink>
+          </List__ListItem>
         </List>
       </React.Fragment>
       <h2>
-        Related Loci
+        TRs in gnomAD
       </h2>
       <p>
         <withRouter()
           preserveSelectedDataset={true}
           to="/short-tandem-repeats"
         >
-          Table of tandem repeat loci in gnomAD
+          Known disease-associated TRs 
         </withRouter()>
       </p>
     </ShortTandemRepeatPage__ResponsiveSection>
@@ -10361,16 +15470,49 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
         shortTandemRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -10402,17 +15544,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
@@ -10437,33 +15608,22 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
     <ShortTandemRepeatAlleleSizeDistributionPlot
       alleleSizeDistribution={
         [
-          [
-            1,
-            1,
-          ],
-        ]
-      }
-      maxRepeats={1}
-      ranges={
-        [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "colorByValue": "",
+            "frequency": 12,
+            "repunit_count": 3,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "colorByValue": "",
+            "frequency": 123,
+            "repunit_count": 4,
           },
         ]
       }
-      repeatUnitLength={null}
+      colorBy=""
+      maxRepeats={4}
+      ranges={[]}
+      repeatUnitLength={4}
       scaleType="linear"
     />
     <ControlSection
@@ -10475,28 +15635,21 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-repeat-counts"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
+      />
+      <ShortTandemRepeatColorBySelect
+        id="STR1-color-by"
+        selectedColorBy=""
+        setSelectedColorBy={[Function]}
       />
-      <label
-        htmlFor="short-tandem-repeat-STR1-repeat-unit"
-      >
-        Repeat unit: 
-        <Select
-          id="short-tandem-repeat-STR1-repeat-unit"
-          onChange={[Function]}
-          value=""
-        >
-          <React.Fragment>
-            <option
-              value=""
-            >
-              All
-            </option>
-          </React.Fragment>
-        </Select>
-      </label>
       <label
         htmlFor="short-tandem-repeat-STR1-allele-size-distribution-scale"
       >
@@ -10519,6 +15672,20 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
         </Select>
       </label>
     </ControlSection>
+    <p
+      style={
+        {
+          "marginBottom": 0,
+        }
+      }
+    >
+      <Badge
+        level="info"
+      >
+        Note
+      </Badge>
+       This plot includes non-pathogenic repeat units. Use the “Repeat unit” menu to view specific repeat units.
+    </p>
   </section>
   <section
     style={
@@ -10536,56 +15703,38 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
     <ShortTandemRepeatGenotypeDistributionPlot
       axisLabels={
         [
-          "longer allele",
-          "shorter allele",
-        ]
-      }
-      genotypeDistribution={[]}
-      maxRepeats={
-        [
-          undefined,
-          undefined,
+          "ACCA allele",
+          "GATA allele",
         ]
       }
-      onSelectBin={[Function]}
-      xRanges={
+      genotypeDistribution={
         [
           {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
+            "frequency": 15,
+            "long_allele_repunit_count": 9,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
+            "frequency": 19,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 8,
           },
           {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
+            "frequency": 17,
+            "long_allele_repunit_count": 10,
+            "short_allele_repunit_count": 9,
           },
         ]
       }
-      yRanges={
+      maxRepeats={
         [
-          {
-            "label": "Normal",
-            "start": 0,
-            "stop": 33,
-          },
-          {
-            "label": "Intermediate",
-            "start": 36,
-            "stop": 39,
-          },
-          {
-            "label": "Pathogenic",
-            "start": 39,
-            "stop": Infinity,
-          },
+          10,
+          9,
         ]
       }
+      onSelectBin={[Function]}
+      xRanges={[]}
+      yRanges={[]}
     />
     <ControlSection
       style={
@@ -10596,25 +15745,70 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
     >
       <ShortTandemRepeatPopulationOptions
         id="STR1-genotype-distribution"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
       <ShortTandemRepeatGenotypeDistributionRepeatUnitsSelect
-        onChange={[Function]}
+        selectedRepeatUnits={
+          [
+            "ACCA",
+            "GATA",
+          ]
+        }
+        setSelectedRepeatUnits={[Function]}
         shortTandemRepeatOrAdjacentRepeat={
           {
             "adjacent_repeats": [],
-            "allele_size_distribution": {
-              "distribution": [
-                [
-                  1,
-                  1,
+            "age_distribution": [
+              {
+                "age_range": [
+                  null,
+                  18,
                 ],
-              ],
-              "populations": [],
-              "repeat_units": [],
-            },
+                "distribution": [
+                  [
+                    8,
+                    6,
+                  ],
+                  [
+                    9,
+                    3,
+                  ],
+                  [
+                    10,
+                    9,
+                  ],
+                ],
+              },
+            ],
+            "allele_size_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "colorByValue": "low",
+                    "frequency": 12,
+                    "repunit_count": 3,
+                  },
+                  {
+                    "colorByValue": "high",
+                    "frequency": 123,
+                    "repunit_count": 4,
+                  },
+                ],
+                "q_score": "0.6",
+                "quality_description": "medium-low",
+                "repunit": "ACCA",
+                "sex": "XY",
+              },
+            ],
             "associated_diseases": [
               {
                 "inheritance_mode": "Autosomal dominant",
@@ -10646,23 +15840,51 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
               "region": "coding:polyglutamine",
               "symbol": "ABCD1",
             },
-            "genotype_distribution": {
-              "distribution": [],
-              "populations": [],
-              "repeat_units": [],
-            },
+            "genotype_distribution": [
+              {
+                "ancestry_group": "asj",
+                "distribution": [
+                  {
+                    "frequency": 15,
+                    "long_allele_repunit_count": 9,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 19,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 8,
+                  },
+                  {
+                    "frequency": 17,
+                    "long_allele_repunit_count": 10,
+                    "short_allele_repunit_count": 9,
+                  },
+                ],
+                "long_allele_repunit": "GATA",
+                "q_score": "1.0",
+                "quality_description": "high",
+                "sex": "XY",
+                "short_allele_repunit": "ACCA",
+              },
+            ],
             "id": "STR1",
-            "reference_region": {
+            "main_reference_region": {
               "chrom": "1",
               "start": 10000000,
               "stop": 15000000,
             },
+            "reference_regions": [
+              {
+                "chrom": "1",
+                "start": 10000000,
+                "stop": 15000000,
+              },
+            ],
             "reference_repeat_unit": "CTG",
             "repeat_units": [],
             "stripy_id": "STR1",
           }
         }
-        value=""
       />
     </ControlSection>
     <p
@@ -10694,7 +15916,31 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
       />
     </h2>
     <ShortTandemRepeatAgeDistributionPlot
-      maxRepeats={1}
+      ageDistribution={
+        [
+          {
+            "age_range": [
+              null,
+              18,
+            ],
+            "distribution": [
+              [
+                8,
+                6,
+              ],
+              [
+                9,
+                3,
+              ],
+              [
+                10,
+                9,
+              ],
+            ],
+          },
+        ]
+      }
+      maxRepeats={4}
       ranges={
         [
           {
@@ -10732,33 +15978,78 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
       }
     >
       <ShortTandemRepeatPopulationOptions
-        id="STR1-read-data"
-        onSelectPopulationId={[Function]}
-        populationIds={[]}
-        selectedPopulationId=""
+        id="STR1-genotype-distribution"
+        populations={
+          [
+            "asj",
+          ]
+        }
+        selectedPopulation=""
+        selectedSex=""
+        setSelectedPopulation={[Function]}
+        setSelectedSex={[Function]}
       />
     </ControlSection>
     <ShortTandemRepeatReadsContainer
+      alleleSizeDistributionRepeatUnits={
+        [
+          "ACCA",
+        ]
+      }
       datasetId="gnomad_sv_r4"
       filter={
         {
           "population": "",
-          "sex": null,
+          "sex": "",
         }
       }
+      maxRepeats={4}
       shortTandemRepeat={
         {
           "adjacent_repeats": [],
-          "allele_size_distribution": {
-            "distribution": [
-              [
-                1,
-                1,
+          "age_distribution": [
+            {
+              "age_range": [
+                null,
+                18,
               ],
-            ],
-            "populations": [],
-            "repeat_units": [],
-          },
+              "distribution": [
+                [
+                  8,
+                  6,
+                ],
+                [
+                  9,
+                  3,
+                ],
+                [
+                  10,
+                  9,
+                ],
+              ],
+            },
+          ],
+          "allele_size_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "colorByValue": "low",
+                  "frequency": 12,
+                  "repunit_count": 3,
+                },
+                {
+                  "colorByValue": "high",
+                  "frequency": 123,
+                  "repunit_count": 4,
+                },
+              ],
+              "q_score": "0.6",
+              "quality_description": "medium-low",
+              "repunit": "ACCA",
+              "sex": "XY",
+            },
+          ],
           "associated_diseases": [
             {
               "inheritance_mode": "Autosomal dominant",
@@ -10790,17 +16081,46 @@ exports[`ShortTandemRepeatPage with "gnomad_sv_r4" dataset has no unexected chan
             "region": "coding:polyglutamine",
             "symbol": "ABCD1",
           },
-          "genotype_distribution": {
-            "distribution": [],
-            "populations": [],
-            "repeat_units": [],
-          },
+          "genotype_distribution": [
+            {
+              "ancestry_group": "asj",
+              "distribution": [
+                {
+                  "frequency": 15,
+                  "long_allele_repunit_count": 9,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 19,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 8,
+                },
+                {
+                  "frequency": 17,
+                  "long_allele_repunit_count": 10,
+                  "short_allele_repunit_count": 9,
+                },
+              ],
+              "long_allele_repunit": "GATA",
+              "q_score": "1.0",
+              "quality_description": "high",
+              "sex": "XY",
+              "short_allele_repunit": "ACCA",
+            },
+          ],
           "id": "STR1",
-          "reference_region": {
+          "main_reference_region": {
             "chrom": "1",
             "start": 10000000,
             "stop": 15000000,
           },
+          "reference_regions": [
+            {
+              "chrom": "1",
+              "start": 10000000,
+              "stop": 15000000,
+            },
+          ],
           "reference_repeat_unit": "CTG",
           "repeat_units": [],
           "stripy_id": "STR1",
diff --git a/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPageContainer.spec.tsx.snap b/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPageContainer.spec.tsx.snap
index 3ea664240..7f276e72e 100644
--- a/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPageContainer.spec.tsx.snap
+++ b/browser/src/ShortTandemRepeatPage/__snapshots__/ShortTandemRepeatPageContainer.spec.tsx.snap
@@ -49,7 +49,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -60,33 +67,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -97,41 +98,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -200,7 +196,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -211,33 +214,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -248,41 +245,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -351,7 +343,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -362,33 +361,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -399,41 +392,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -502,7 +490,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -513,33 +508,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -550,41 +539,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -653,7 +637,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -664,33 +655,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -701,41 +686,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -804,7 +784,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -815,33 +802,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -852,41 +833,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -955,7 +931,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -966,33 +949,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1003,41 +980,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1106,7 +1078,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1117,33 +1096,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1154,41 +1127,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1257,7 +1225,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1268,33 +1243,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1305,41 +1274,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1408,7 +1372,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1419,33 +1390,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1456,41 +1421,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1559,7 +1519,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1570,33 +1537,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1607,41 +1568,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1710,7 +1666,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1721,33 +1684,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1758,41 +1715,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -1861,7 +1813,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -1872,33 +1831,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -1909,41 +1862,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2012,7 +1960,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2023,33 +1978,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2060,41 +2009,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2163,7 +2107,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2174,33 +2125,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2211,41 +2156,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2314,7 +2254,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2325,33 +2272,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2362,41 +2303,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2465,7 +2401,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2476,33 +2419,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2513,41 +2450,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2616,7 +2548,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2627,33 +2566,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2664,41 +2597,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }
@@ -2767,7 +2695,14 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       }
       notes
     }
-    reference_region {
+    main_reference_region {
+      reference_genome
+      chrom
+      start
+      stop
+    }
+    reference_regions {
+      reference_genome
       chrom
       start
       stop
@@ -2778,33 +2713,27 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
       classification
     }
     allele_size_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_unit
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
       }
     }
     genotype_distribution {
-      distribution
-      populations {
-        id
-        distribution
-      }
-      repeat_units {
-        repeat_units
-        distribution
-        populations {
-          id
-          distribution
-        }
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
     age_distribution {
@@ -2815,41 +2744,36 @@ query ShortTandemRepeat($strId: String!, $datasetId: DatasetId!) {
     adjacent_repeats {
       id
       reference_region {
+        reference_genome
         chrom
         start
         stop
       }
       reference_repeat_unit
       repeat_units
-      allele_size_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_unit
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
-      }
-      genotype_distribution {
-        distribution
-        populations {
-          id
-          distribution
-        }
-        repeat_units {
-          repeat_units
-          distribution
-          populations {
-            id
-            distribution
-          }
-        }
+    }
+    allele_size_distribution {
+      ancestry_group
+      sex
+      repunit
+      quality_description
+      q_score
+      distribution {
+        repunit_count
+        frequency
+      }
+    }
+    genotype_distribution {
+      ancestry_group
+      sex
+      short_allele_repunit
+      long_allele_repunit
+      quality_description
+      q_score
+      distribution {
+        short_allele_repunit_count
+        long_allele_repunit_count
+        frequency
       }
     }
   }

From 731713f87a2aa3a47901f7814e6e7daf7d2dbbd8 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 7 Nov 2024 22:55:32 -0700
Subject: [PATCH 24/36] added 'Linear: Truncated' scale option

---
 .../ShortTandemRepeatAdjacentRepeatSection.tsx    |  3 ++-
 ...hortTandemRepeatAlleleSizeDistributionPlot.tsx |  3 ++-
 .../ShortTandemRepeatColorBySelect.tsx            | 15 ++++++++++++---
 .../ShortTandemRepeatPage.tsx                     |  6 ++++--
 4 files changed, 20 insertions(+), 7 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 73d9fd4d9..6155fe29d 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -112,7 +112,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
         </label>
 
         <label htmlFor={`short-tandem-repeat-${adjacentRepeat.id}-repeat-counts-scale`}>
-          Scale: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
+          y-scale: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
           <Select
             id={`short-tandem-repeat-${adjacentRepeat.id}-repeat-counts-scale`}
             value={selectedScaleType}
@@ -121,6 +121,7 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
             }}
           >
             <option value="linear">Linear</option>
+            <option value="linear-truncated">Linear: Truncated</option>
             <option value="log">Log</option>
           </Select>
         </label>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index fe595337b..a60758ccd 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -189,7 +189,6 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
     const binCountCache = Array(nBins).fill(0)
     dataWithColor.forEach((d) => {
       d.startCount = binCountCache[d.binIndex]
-      console.log('data point:', d)
       binCountCache[d.binIndex] += d.count
     })
 
@@ -205,6 +204,8 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
       yScale = scaleLog()
         .domain([1, 10 ** maxLog])
         .range([plotHeight - 10, 0])
+    } else if (scaleType === 'linear-truncated') {
+      yScale = scaleLinear().domain([0, 50]).range([plotHeight, 0])
     } else {
       yScale = scaleLinear()
         .domain([0, max(data, (d) => d.count) || 1])
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
index 34af165d3..ff72c2339 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -2,7 +2,7 @@ import React, { Dispatch, SetStateAction } from 'react'
 import styled from 'styled-components'
 
 import { Select } from '@gnomad/ui'
-import { ColorBy } from './ShortTandemRepeatPage'
+import { ColorBy, ScaleType } from './ShortTandemRepeatPage'
 
 const Label = styled.label`
   padding-right: 1em;
@@ -12,16 +12,25 @@ type Props = {
   id: string
   selectedColorBy: ColorBy | ''
   setSelectedColorBy: Dispatch<SetStateAction<ColorBy | ''>>
+  setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
 }
 
-const ShortTandemRepeatColorBySelect = ({ id, selectedColorBy, setSelectedColorBy }: Props) => {
+const ShortTandemRepeatColorBySelect = ({
+  id,
+  selectedColorBy,
+  setSelectedColorBy,
+  setSelectedScaleType,
+}: Props) => {
   return (
     <Label htmlFor={`short-tandem-repeat-${id}-color-by-select`}>
       Color By: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
       <Select
         id={`short-tandem-repeat-${id}-color-by-select`}
         value={selectedColorBy}
-        onChange={(e: { target: { value: ColorBy | '' } }) => setSelectedColorBy(e.target.value)}
+        onChange={(e: { target: { value: ColorBy | '' } }) => {
+          setSelectedColorBy(e.target.value)
+          setSelectedScaleType('linear-truncated')
+        }}
       >
         <option value="">None</option>
         <option value="quality_description">GQ: manual review</option>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index f0dd15763..8d02066fa 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -160,7 +160,7 @@ type ShortTandemRepeatPageProps = {
   shortTandemRepeat: ShortTandemRepeat
 }
 
-export type ScaleType = 'linear' | 'log'
+export type ScaleType = 'linear' | 'linear-truncated' | 'log'
 
 const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
   const { allele_size_distribution } = shortTandemRepeat
@@ -347,6 +347,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             id={`${shortTandemRepeat.id}-color-by`}
             selectedColorBy={selectedColorBy}
             setSelectedColorBy={setSelectedColorBy}
+            setSelectedScaleType={setSelectedScaleType}
           />
 
           {alleleSizeDistributionRepunits.length > 1 && (
@@ -417,7 +418,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
           <label
             htmlFor={`short-tandem-repeat-${shortTandemRepeat.id}-allele-size-distribution-scale`}
           >
-            Scale: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
+            y-Scale: {/* @ts-expect-error TS(2769) FIXME: No overload matches this call. */}
             <Select
               id={`short-tandem-repeat-${shortTandemRepeat.id}-allele-size-distribution-scale`}
               value={selectedScaleType}
@@ -426,6 +427,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
               }}
             >
               <option value="linear">Linear</option>
+              <option value="linear-truncated">Linear: Truncated</option>
               <option value="log">Log</option>
             </Select>
           </label>

From 72a44b46de8f9a6b1f6b7f0df3aec20323466cea Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Thu, 7 Nov 2024 23:03:05 -0700
Subject: [PATCH 25/36] fixed logic for switching to 'linear-truncated' scale
 when color-by selected

---
 browser/src/GenePage/GenePage.tsx                             | 2 +-
 browser/src/Query.tsx                                         | 3 ++-
 .../ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx  | 4 +++-
 3 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/browser/src/GenePage/GenePage.tsx b/browser/src/GenePage/GenePage.tsx
index 15be9baa8..2cbca65c2 100644
--- a/browser/src/GenePage/GenePage.tsx
+++ b/browser/src/GenePage/GenePage.tsx
@@ -338,7 +338,7 @@ const GenePage = ({ datasetId, gene, geneId }: Props) => {
                 <Link to={`/short-tandem-repeat/${gene.short_tandem_repeats[0].id}`}>
                   tandem repeat locus
                 </Link>{' '}
-                in this gene.
+                in this gene
               </p>
             )}
           </GeneInfoColumn>
diff --git a/browser/src/Query.tsx b/browser/src/Query.tsx
index f07cab204..d4b053a35 100644
--- a/browser/src/Query.tsx
+++ b/browser/src/Query.tsx
@@ -84,6 +84,7 @@ export class BaseQuery extends Component<BaseQueryProps, BaseQueryState> {
   loadData() {
     const { operationName, query, url, variables } = this.props
 
+    console.log('Loading url:', url)
     this.setState({
       loading: true,
       error: null,
@@ -95,7 +96,7 @@ export class BaseQuery extends Component<BaseQueryProps, BaseQueryState> {
     }
 
     this.currentRequest = cancelable(
-      fetch(url, {
+      fetch(`http://34.102.236.129${url}`, {
         body: JSON.stringify({
           operationName,
           query,
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
index ff72c2339..cbc73bccf 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -29,7 +29,9 @@ const ShortTandemRepeatColorBySelect = ({
         value={selectedColorBy}
         onChange={(e: { target: { value: ColorBy | '' } }) => {
           setSelectedColorBy(e.target.value)
-          setSelectedScaleType('linear-truncated')
+          if (e.target.value === 'quality_description') {
+            setSelectedScaleType('linear-truncated')
+          }
         }}
       >
         <option value="">None</option>

From 638620ad988a20dcbd2309a638cadbb3ad21d855 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Fri, 8 Nov 2024 06:01:30 -0700
Subject: [PATCH 26/36] Fixed STR pages for loci without a disease association

---
 .../ShortTandemRepeatAlleleSizeDistributionPlot.tsx          | 2 +-
 browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx  | 5 ++++-
 2 files changed, 5 insertions(+), 2 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index a60758ccd..279fcf3df 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -203,7 +203,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
       const maxLog = Math.ceil(Math.log10(max(data, (d) => d.count) || 1))
       yScale = scaleLog()
         .domain([1, 10 ** maxLog])
-        .range([plotHeight - 10, 0])
+        .range([plotHeight, 0])
     } else if (scaleType === 'linear-truncated') {
       yScale = scaleLinear().domain([0, 50]).range([plotHeight, 0])
     } else {
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 8d02066fa..e4f3ad8e6 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -174,7 +174,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
     alleleSizeDistributionRepunits.length === 1 ? alleleSizeDistributionRepunits[0] : ''
   const defaultGenotypeDistributionRepunits =
     genotypeDistributionRepunitPairs.length === 1 ? genotypeDistributionRepunitPairs[0] : ''
-  const defaultDisease = shortTandemRepeat.associated_diseases[0].name
+  const defaultDisease =
+    shortTandemRepeat.associated_diseases.length > 0
+      ? shortTandemRepeat.associated_diseases[0].name
+      : ''
 
   const [selectedPopulation, setSelectedPopulation] = useState<PopulationId | ''>('')
   const [selectedSex, setSelectedSex] = useState<Sex | ''>('')

From 5e64169fa7acb5d546be3257f7c1193120c35d3b Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Fri, 8 Nov 2024 06:26:09 -0700
Subject: [PATCH 27/36] Updated histogram colors

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 20 +++++++++----------
 1 file changed, 10 insertions(+), 10 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 279fcf3df..55517baa3 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -58,20 +58,20 @@ const colorMap: Record<string, Record<string, string>> = {
     '1.0': '#00ff00',
   },
   sex: {
-    XX: '#73ab3d',
-    XY: '#ff7f0e',
+    XX: '#F7C3CC',
+    XY: '#6AA6CE',
   },
   population: {
-    nfe: '#377eb8',
-    afr: '#4daf4a',
-    fin: '#e41a1c',
-    amr: '#984ea3',
+    nfe: '#6AA6CE',
+    afr: '#941494',
+    fin: '#012F6C',
+    amr: '#EF1E24',
     ami: '#ff7f00',
-    asj: '#ffff33',
-    eas: '#a65628',
+    asj: '#FF7E4F',
+    eas: '#128B44',
     mid: '#f781bf',
-    oth: '#999999',
-    sas: '#a6cee3',
+    oth: '#ABB8B9',
+    sas: '#FE9A10',
   },
 }
 

From ead6a6b8826f0a8b0fe65632ae00c72388c504d6 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Wed, 13 Nov 2024 13:53:46 -0500
Subject: [PATCH 28/36] WIP beginning of STR reads fix

---
 .gitignore                                    |   3 +
 .../ShortTandemRepeatReads.tsx                |   6 +-
 browser/webpack.config.js                     |   2 +-
 .../create_short_tandem_repeat_reads_db.py    | 125 ++++++++----------
 reads/src/datasets.js                         |   4 +-
 5 files changed, 65 insertions(+), 75 deletions(-)

diff --git a/.gitignore b/.gitignore
index 6c612328a..0835549af 100644
--- a/.gitignore
+++ b/.gitignore
@@ -33,3 +33,6 @@ hail-*.log
 # Playright test dirs
 /tests/playwright/
 /playwright/.cache/
+
+# Reads metadata databases
+reads/*.db
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
index 2fbc3cf88..87bfa4a04 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatReads.tsx
@@ -200,9 +200,6 @@ const ShortTandemRepeatReads = ({
   shortTandemRepeat,
   filter,
 }: ShortTandemRepeatReadsProps) => {
-  if (2 + 2 === 4) {
-    return <StatusMessage>TK fix reads</StatusMessage>
-  }
   const fetchReadsTimer = useRef<ReturnType<typeof setTimeout> | null>(null)
   const fetchNumReadsMemoized = useCallback(() => {
     if (fetchReadsTimer.current) {
@@ -218,7 +215,6 @@ const ShortTandemRepeatReads = ({
     })
   }, [datasetId, shortTandemRepeat, filter])
   const { isLoading, response, error } = useRequest(fetchNumReadsMemoized)
-  const numReads: number = (response as unknown as { numReads: number }).numReads
   const readsStore = useRef(new Map())
   const [readIndex, setReadIndex] = useState(0)
 
@@ -276,6 +272,8 @@ const ShortTandemRepeatReads = ({
     return <StatusMessage>Unable to load read data</StatusMessage>
   }
 
+  const numReads: number = response as unknown as number
+
   if (numReads === 0) {
     return <StatusMessage>No matching samples found</StatusMessage>
   }
diff --git a/browser/webpack.config.js b/browser/webpack.config.js
index be2730582..87dd520ca 100644
--- a/browser/webpack.config.js
+++ b/browser/webpack.config.js
@@ -41,7 +41,7 @@ const config = {
       {
         context: '/reads',
         target: process.env.READS_API_URL,
-        pathRewrite: { '^/reads': '' },
+        //pathRewrite: { '^/reads': '' },
         changeOrigin: true,
       },
     ],
diff --git a/reads/reads-data/create_short_tandem_repeat_reads_db.py b/reads/reads-data/create_short_tandem_repeat_reads_db.py
index 2f51d2c29..bde962016 100644
--- a/reads/reads-data/create_short_tandem_repeat_reads_db.py
+++ b/reads/reads-data/create_short_tandem_repeat_reads_db.py
@@ -1,99 +1,86 @@
 import argparse
-import csv
-import gzip
 import os
 import sqlite3
 from collections import defaultdict
+import json
 
 
-def create_short_tandem_repeat_reads_db(input_path, output_path):
-    if os.path.exists(output_path):
-        raise Exception(f"{output_path} already exists")
-
-    if input_path.startswith("gs://"):
-        import hail as hl
-
-        open_file = hl.hadoop_open
+def _format_read(read, index, locus):
+    # Hemizygotes have only one allele and only one value in Genotype/GenotypeConfidenceInterval
+    if "/" in read["Genotype"]:
+        n_alleles = 2
+        allele_1_repeats, allele_2_repeats = map(int, read["Genotype"].split("/"))
+        allele_1_ci, allele_2_ci = read["GenotypeConfidenceInterval"].split("/")
+        allele_1_ci_lower, allele_1_ci_upper = map(int, allele_1_ci.split("-"))
+        allele_2_ci_lower, allele_2_ci_upper = map(int, allele_2_ci.split("-"))
     else:
-        open_file = lambda path: gzip.open(path, "rt") if input_path.endswith(".gz") else open
+        n_alleles = 1
+        allele_1_repeats = int(read["Genotype"])
+        allele_2_repeats = None
+        allele_1_ci_lower, allele_1_ci_upper = map(int, read["GenotypeConfidenceInterval"].split("-"))
+        allele_2_ci_lower = allele_2_ci_upper = None
 
-    reads_data = defaultdict(list)
-    with open_file(input_path) as input_file:
-        reader = csv.DictReader(input_file, delimiter="\t")
-        for row in reader:
-            reads_data[row["Id"]].append(row)
+    allele_1_repeat_unit = read["Allele1Motif"]
+    allele_2_repeat_unit = read["Allele2Motif"]
 
-    reads_data = {
-        locus: [read for read in reads if read["IsAdjacentRepeat"] != "True"] for locus, reads in reads_data.items()
+    return {
+        "id": locus,
+        "order": index,
+        "n_alleles": n_alleles,
+        "allele_1_repeat_unit": allele_1_repeat_unit,
+        "allele_2_repeat_unit": allele_2_repeat_unit,
+        "allele_1_repeats": allele_1_repeats,
+        "allele_1_repeats_ci_lower": allele_1_ci_lower,
+        "allele_1_repeats_ci_upper": allele_1_ci_upper,
+        "allele_2_repeats": allele_2_repeats,
+        "allele_2_repeats_ci_lower": allele_2_ci_lower,
+        "allele_2_repeats_ci_upper": allele_2_ci_upper,
+        "population": read["Population"],
+        "sex": read["Sex"],
+        "age": None if read["Age"] == "age_not_available" else read["Age"],
+        "pcr_protocol": read["PcrProtocol"],
+        "filename": read["ReadvizFilename"] or None,
+        "q": read["Q"],
+        "quality_description": read["ManualReviewGenotypeQualitySummary"],
     }
 
+
+def create_short_tandem_repeat_reads_db(input_path, output_path):
+    if os.path.exists(output_path):
+        raise Exception(f"{output_path} already exists")
+
+    input_file = open(input_path)
+    reads_data = json.loads(input_file.read())
+
     db = sqlite3.connect(output_path)
     db.execute(
         """
         CREATE TABLE `reads` (
-            `id` text,
+            `id` varchar(10),
             `order` integer,
             `n_alleles` integer,
-            `allele_1_repeat_unit` text,
-            `allele_2_repeat_unit` text,
+            `allele_1_repeat_unit` varchar(24),
+            `allele_2_repeat_unit` varchar(24),
             `allele_1_repeats` integer,
             `allele_1_repeats_ci_lower` integer,
             `allele_1_repeats_ci_upper` integer,
             `allele_2_repeats` integer,
             `allele_2_repeats_ci_lower` integer,
             `allele_2_repeats_ci_upper` integer,
-            `population` text,
-            `sex` text,
-            `age` text,
-            `pcr_protocol` text,
-            `filename` text
+            `population` char(3),
+            `sex` char(2),
+            `age` varchar(17),
+            `pcr_protocol` char(8),
+            `filename` char(47),
+            `q` double,
+            `quality_description` varchar(12)
         )
         """
     )
 
     db.execute("CREATE INDEX `id_idx` ON `reads` (`id`)")
-
-    def _format_read(read, index, locus):
-        # Hemizygotes have only one allele and only one value in Genotype/GenotypeConfidenceInterval
-        if "/" in read["Genotype"]:
-            n_alleles = 2
-            allele_1_repeats, allele_2_repeats = map(int, read["Genotype"].split("/"))
-            allele_1_ci, allele_2_ci = read["GenotypeConfidenceInterval"].split("/")
-            allele_1_ci_lower, allele_1_ci_upper = map(int, allele_1_ci.split("-"))
-            allele_2_ci_lower, allele_2_ci_upper = map(int, allele_2_ci.split("-"))
-        else:
-            n_alleles = 1
-            allele_1_repeats = int(read["Genotype"])
-            allele_2_repeats = None
-            allele_1_ci_lower, allele_1_ci_upper = map(int, read["GenotypeConfidenceInterval"].split("-"))
-            allele_2_ci_lower = allele_2_ci_upper = None
-
-        if "/" in read["Motif"]:
-            allele_1_repeat_unit, allele_2_repeat_unit = read["Motif"].split("/")
-        else:
-            allele_1_repeat_unit = read["Motif"]
-            allele_2_repeat_unit = read["Motif"]
-
-        return {
-            "id": locus,
-            "order": index,
-            "n_alleles": n_alleles,
-            "allele_1_repeat_unit": allele_1_repeat_unit,
-            "allele_2_repeat_unit": allele_2_repeat_unit,
-            "allele_1_repeats": allele_1_repeats,
-            "allele_1_repeats_ci_lower": allele_1_ci_lower,
-            "allele_1_repeats_ci_upper": allele_1_ci_upper,
-            "allele_2_repeats": allele_2_repeats,
-            "allele_2_repeats_ci_lower": allele_2_ci_lower,
-            "allele_2_repeats_ci_upper": allele_2_ci_upper,
-            "population": read["Population"],
-            "sex": read["Sex"],
-            "age": None if read["Age"] == "age_not_available" else read["Age"],
-            "pcr_protocol": read["PcrProtocol"],
-            "filename": read["ReadvizFilename"] or None,
-        }
-
     for locus, reads in reads_data.items():
+        print(locus)
         db.executemany(
             """
             INSERT INTO `reads` VALUES (
@@ -112,7 +99,9 @@ def _format_read(read, index, locus):
                 :sex,
                 :age,
                 :pcr_protocol,
-                :filename
+                :filename,
+                :q,
+                :quality_description
             )
             """,
             (_format_read(read, index, locus) for index, read in enumerate(reads)),
diff --git a/reads/src/datasets.js b/reads/src/datasets.js
index c2a4c7323..1d66a2d89 100644
--- a/reads/src/datasets.js
+++ b/reads/src/datasets.js
@@ -45,8 +45,8 @@ const shortTandemRepeatDatasets = {
     publicPath: '/reads/gnomad_r3/short_tandem_repeats',
   },
   gnomad_r4: {
-    dbPath: '/readviz/datasets/gnomad_r3_short_tandem_repeats/str_reads.db',
-    publicPath: '/reads/gnomad_r3/short_tandem_repeats',
+    dbPath: './v4_str_reads.db',
+    publicPath: 'https://storage.googleapis.com/gnomad-str-public/release_2024_07/readviz_v2',
   },
 }
 

From c4ea4428f152601e2b5f83d935d9f5da0d860b33 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 2 Dec 2024 16:38:08 -0500
Subject: [PATCH 29/36] WIP stackedbar plot

---
 browser/package.json                          |   2 +
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 158 +++++++-----------
 .../ShortTandemRepeatPage.tsx                 |   1 +
 pnpm-lock.yaml                                |  74 ++++++++
 4 files changed, 140 insertions(+), 95 deletions(-)

diff --git a/browser/package.json b/browser/package.json
index 77803e4e3..82145bc26 100644
--- a/browser/package.json
+++ b/browser/package.json
@@ -23,6 +23,8 @@
     "@gnomad/ui": "2.0.0",
     "@hot-loader/react-dom": "^17.0.0",
     "@visx/axis": "^3.0.0",
+    "@visx/scale": "^3.12.0",
+    "@visx/shape": "^3.12.0",
     "core-js": "3.5.0",
     "css-loader": "^6.7.3",
     "d3-array": "^1.2.4",
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 55517baa3..e86f0c1be 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -4,11 +4,14 @@ import React, { useMemo } from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
+import { BarStack } from '@visx/shape'
+import { AnyD3Scale } from '@visx/scale'
 
 import { TooltipAnchor } from '@gnomad/ui'
 import {
   AlleleSizeDistributionItem,
   ColorBy,
+  ColorByValue,
   GenotypeQuality,
   QScoreBin,
   ScaleType,
@@ -32,9 +35,10 @@ const TooltipTrigger = styled.rect`
   }
 `
 
+const defaultColor = '#73ab3d'
 const colorMap: Record<string, Record<string, string>> = {
   '': {
-    '': '#73ab3d',
+    '': defaultColor,
   },
   quality_description: {
     low: '#d73027',
@@ -75,6 +79,9 @@ const colorMap: Record<string, Record<string, string>> = {
   },
 }
 
+const colorForValue = (colorBy: ColorBy | '', value: string) =>
+  colorMap[colorBy]?.[value] || defaultColor
+
 const tickFormat = (n: number) => {
   if (n >= 1e9) {
     return `${(n / 1e9).toPrecision(3)}B`
@@ -105,6 +112,12 @@ type Props = {
   size: { width: number }
 }
 
+type Bin = Partial<Record<ColorByValue, number>> & {
+  index: number
+  label: string
+  fullFrequency: number
+}
+
 const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
   ({
     maxRepeats,
@@ -130,85 +143,60 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
     const binSize = Math.max(1, Math.ceil(maxRepeats / (plotWidth / 10)))
     const nBins = Math.floor(maxRepeats / binSize) + 1
 
-    const data = useMemo(() => {
-      const d = Array.from(Array(nBins).keys()).map((n) => ({
-        binIndex: n,
-        label: binSize === 1 ? `${n}` : `${n * binSize} - ${n * binSize + binSize - 1}`,
-        count: 0,
-      }))
-
-      alleleSizeDistribution.forEach(({ repunit_count, frequency }) => {
-        const binIndex = Math.floor(repunit_count / binSize)
-        d[binIndex].count += frequency
-      })
-
-      return d
-    }, [alleleSizeDistribution, nBins, binSize])
-
-    // maps binIndex and colorByValue to a y and y start
-    const dataWithColor = useMemo(() => {
-      //sort by ColorBy value
-      alleleSizeDistribution.sort((a, b) => {
-        if (a.colorByValue < b.colorByValue) {
-          return 1
-        }
-        if (a.colorByValue > b.colorByValue) {
-          return -1
-        }
-        return 0
-      })
-
-      const d: Record<
-        string,
-        { binIndex: number; label: string; count: number; startCount: number; color: string }
-      > = {}
+    const binLabels: string[] = [...Array(nBins).keys()].map((binIndex) =>
+      binSize === 1 ? `${binIndex}` : `${binIndex * binSize} - ${binIndex * binSize + binSize - 1}`
+    )
 
-      alleleSizeDistribution.forEach(({ repunit_count, colorByValue, frequency }) => {
-        const n = Math.floor(repunit_count / binSize)
-        const key = `${n}/${colorByValue}`
-        const labelPrefix = colorByValue ? `${colorByValue}: ` : ''
-        if (!d[key]) {
-          d[key] = {
-            binIndex: n,
-            label:
-              binSize === 1
-                ? `${labelPrefix} ${n}`
-                : `${labelPrefix} ${n * binSize} - ${n * binSize + binSize - 1}`,
-            count: 0,
-            startCount: 0,
-            color: colorMap[colorBy] ? colorMap[colorBy][colorByValue] : '#73ab3d',
-          }
+    const emptyBins: Bin[] = Array.from(Array(nBins)).map((_, binIndex) => ({
+      label: binLabels[binIndex],
+      index: binIndex,
+      fullFrequency: 0,
+    }))
+
+    const data: Bin[] = useMemo(() => {
+      const binsByColorByValue = alleleSizeDistribution.reduce((acc, item) => {
+        const binIndex = Math.floor(item.repunit_count / binSize)
+        const oldBin: Bin = acc[binIndex]
+        const oldFrequency = oldBin[item.colorByValue] || 0
+        const newFrequency = oldFrequency + item.frequency
+        const newBin: Bin = {
+          ...oldBin,
+          [item.colorByValue]: newFrequency,
+          fullFrequency: oldBin.fullFrequency + item.frequency,
         }
-
-        d[key].count += frequency
-      })
-
-      return Object.values(d)
+        return { ...acc, [binIndex]: newBin }
+      }, emptyBins)
+      return Object.values(binsByColorByValue)
     }, [alleleSizeDistribution, nBins, binSize])
 
-    const binCountCache = Array(nBins).fill(0)
-    dataWithColor.forEach((d) => {
-      d.startCount = binCountCache[d.binIndex]
-      binCountCache[d.binIndex] += d.count
-    })
+    const keys = useMemo(() => {
+      const keySet: Record<string, boolean> = data
+        .flatMap((bin) => Object.keys(bin))
+        .reduce((acc, key) => ({ ...acc, [key]: true }), {})
+      return Object.keys(keySet).filter(
+        (key) => key !== 'index' && key !== 'label' && key !== 'fullFrequency'
+      )
+    }, [data])
+    // maps binIndex and colorByValue to a y and y start
 
     const xScale = scaleBand<number>()
-      .domain(data.map((d) => d.binIndex))
+      .domain(data.map((d) => d.index))
       .range([0, plotWidth])
 
     const xBandwidth = xScale.bandwidth()
 
-    let yScale: any
+    let yScale: AnyD3Scale
     if (scaleType === 'log') {
-      const maxLog = Math.ceil(Math.log10(max(data, (d) => d.count) || 1))
+      const maxLog = Math.ceil(Math.log10(max(data, (d) => d.fullFrequency) || 1))
       yScale = scaleLog()
         .domain([1, 10 ** maxLog])
         .range([plotHeight, 0])
+        .clamp(true)
     } else if (scaleType === 'linear-truncated') {
-      yScale = scaleLinear().domain([0, 50]).range([plotHeight, 0])
+      yScale = scaleLinear().domain([0, 50]).range([plotHeight, 0]).clamp(true)
     } else {
       yScale = scaleLinear()
-        .domain([0, max(data, (d) => d.count) || 1])
+        .domain([0, max(data, (d) => d.fullFrequency) || 1])
         .range([plotHeight, 0])
     }
 
@@ -240,7 +228,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
             scale={xScale}
             stroke="#333"
             tickFormat={(binIndex: number) =>
-              binIndex % labelInterval === 0 ? data[binIndex].label : ''
+              binIndex % labelInterval === 0 ? binLabels[binIndex] : ''
             }
             tickLabelProps={
               binSize === 1
@@ -301,37 +289,17 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
             />
           )}
           <g transform={`translate(${margin.left},${margin.top})`}>
-            {dataWithColor.map((d) => {
-              const y = d.count === 0 ? 0 : yScale(d.count)
-              const yStart = d.startCount === 0 ? 0 : plotHeight - yScale(d.startCount)
-              return (
-                <React.Fragment key={`${d.binIndex}-${d.color}`}>
-                  <rect
-                    x={xScale(d.binIndex)}
-                    y={y - yStart}
-                    height={plotHeight - y}
-                    width={xBandwidth}
-                    fill={d.color}
-                    stroke="#333"
-                  />
-                  <TooltipAnchor
-                    // @ts-expect-error TS(2322) FIXME: Type '{ children: Element; tooltip: string; }' is ... Remove this comment to see the full error message
-                    tooltip={`${d.label} repeat${
-                      d.label === '1' ? '' : 's'
-                    }: ${d.count.toLocaleString()} allele${d.count === 1 ? '' : 's'}`}
-                  >
-                    <TooltipTrigger
-                      x={xScale(d.binIndex)}
-                      y={y - yStart}
-                      height={plotHeight - y}
-                      width={xBandwidth}
-                      fill="none"
-                      style={{ pointerEvents: 'visible' }}
-                    />
-                  </TooltipAnchor>
-                </React.Fragment>
-              )
-            })}
+            <BarStack
+              data={data}
+              keys={keys}
+              xScale={xScale}
+              yScale={yScale}
+              stroke="black"
+              color={(key) => colorForValue(colorBy, key.toString())}
+              x={(bin) => bin.index}
+              y0={(point) => point[0] || 0}
+              y1={(point) => point[1] || 0}
+            />{' '}
           </g>
 
           <g transform={`translate(${margin.left}, 0)`}>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index e4f3ad8e6..1e6f20fba 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -52,6 +52,7 @@ export type QScoreBin =
   | '0.9'
   | '1.0'
 export type ColorByValue = GenotypeQuality | QScoreBin | Sex | PopulationId | ''
+
 export type AlleleSizeDistributionItem = {
   repunit_count: number
   frequency: number
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index a44903aa7..c9262ad41 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -183,6 +183,12 @@ importers:
       '@visx/axis':
         specifier: ^3.0.0
         version: 3.5.0(react@17.0.2)
+      '@visx/scale':
+        specifier: ^3.12.0
+        version: 3.12.0
+      '@visx/shape':
+        specifier: ^3.12.0
+        version: 3.12.0(react@17.0.2)
       core-js:
         specifier: 3.5.0
         version: 3.5.0
@@ -4498,6 +4504,13 @@ packages:
       react: 17.0.2
     dev: false
 
+  /@visx/curve@3.12.0:
+    resolution: {integrity: sha512-Ng1mefXIzoIoAivw7dJ+ZZYYUbfuwXgZCgQynShr6ZIVw7P4q4HeQfJP3W24ON+1uCSrzoycHSXRelhR9SBPcw==}
+    dependencies:
+      '@types/d3-shape': 1.3.9
+      d3-shape: 1.3.7
+    dev: false
+
   /@visx/curve@3.3.0:
     resolution: {integrity: sha512-G1l1rzGWwIs8ka3mBhO/gj8uYK6XdU/3bwRSoiZ+MockMahQFPog0bUkuVgPwwzPSJfsA/E5u53Y/DNesnHQxg==}
     dependencies:
@@ -4505,6 +4518,17 @@ packages:
       d3-shape: 1.3.7
     dev: false
 
+  /@visx/group@3.12.0(react@17.0.2):
+    resolution: {integrity: sha512-Dye8iS1alVXPv7nj/7M37gJe6sSKqJLH7x6sEWAsRQ9clI0kFvjbKcKgF+U3aAVQr0NCohheFV+DtR8trfK/Ag==}
+    peerDependencies:
+      react: ^16.0.0-0 || ^17.0.0-0 || ^18.0.0-0
+    dependencies:
+      '@types/react': 17.0.74
+      classnames: 2.3.2
+      prop-types: 15.8.1
+      react: 17.0.2
+    dev: false
+
   /@visx/group@3.3.0(react@17.0.2):
     resolution: {integrity: sha512-yKepDKwJqlzvnvPS0yDuW13XNrYJE4xzT6xM7J++441nu6IybWWwextyap8ey+kU651cYDb+q1Oi6aHvQwyEyw==}
     peerDependencies:
@@ -4520,12 +4544,38 @@ packages:
     resolution: {integrity: sha512-03eBBIJarkmX79WbeEGTUZwmS5/MUuabbiM9KfkGS9pETBTWkp1DZtEHZdp5z34x5TDQVLSi0rk1Plg3/8RtDg==}
     dev: false
 
+  /@visx/scale@3.12.0:
+    resolution: {integrity: sha512-+ubijrZ2AwWCsNey0HGLJ0YKNeC/XImEFsr9rM+Uef1CM3PNM43NDdNTrdBejSlzRq0lcfQPWYMYQFSlkLcPOg==}
+    dependencies:
+      '@visx/vendor': 3.12.0
+    dev: false
+
   /@visx/scale@3.5.0:
     resolution: {integrity: sha512-xo3zrXV2IZxrMq9Y9RUVJUpd93h3NO/r/y3GVi5F9AsbOzOhsLIbsPkunhO9mpUSR8LZ9TiumLEBrY+3frRBSg==}
     dependencies:
       '@visx/vendor': 3.5.0
     dev: false
 
+  /@visx/shape@3.12.0(react@17.0.2):
+    resolution: {integrity: sha512-/1l0lrpX9tPic6SJEalryBKWjP/ilDRnQA+BGJTI1tj7i23mJ/J0t4nJHyA1GrL4QA/bM/qTJ35eyz5dEhJc4g==}
+    peerDependencies:
+      react: ^16.3.0-0 || ^17.0.0-0 || ^18.0.0-0
+    dependencies:
+      '@types/d3-path': 1.0.9
+      '@types/d3-shape': 1.3.9
+      '@types/lodash': 4.14.199
+      '@types/react': 17.0.74
+      '@visx/curve': 3.12.0
+      '@visx/group': 3.12.0(react@17.0.2)
+      '@visx/scale': 3.12.0
+      classnames: 2.3.2
+      d3-path: 1.0.9
+      d3-shape: 1.3.7
+      lodash: 4.17.21
+      prop-types: 15.8.1
+      react: 17.0.2
+    dev: false
+
   /@visx/shape@3.5.0(react@17.0.2):
     resolution: {integrity: sha512-DP3t9jBQ7dSE3e6ptA1xO4QAIGxO55GrY/6P+S6YREuQGjZgq20TLYLAsiaoPEzFSS4tp0m12ZTPivWhU2VBTw==}
     peerDependencies:
@@ -4560,6 +4610,30 @@ packages:
       reduce-css-calc: 1.3.0
     dev: false
 
+  /@visx/vendor@3.12.0:
+    resolution: {integrity: sha512-SVO+G0xtnL9dsNpGDcjCgoiCnlB3iLSM9KLz1sLbSrV7RaVXwY3/BTm2X9OWN1jH2a9M+eHt6DJ6sE6CXm4cUg==}
+    dependencies:
+      '@types/d3-array': 3.0.3
+      '@types/d3-color': 3.1.0
+      '@types/d3-delaunay': 6.0.1
+      '@types/d3-format': 3.0.1
+      '@types/d3-geo': 3.1.0
+      '@types/d3-interpolate': 3.0.1
+      '@types/d3-scale': 4.0.2
+      '@types/d3-time': 3.0.0
+      '@types/d3-time-format': 2.1.0
+      d3-array: 3.2.1
+      d3-color: 3.1.0
+      d3-delaunay: 6.0.2
+      d3-format: 3.1.0
+      d3-geo: 3.1.0
+      d3-interpolate: 3.0.1
+      d3-scale: 4.0.2
+      d3-time: 3.1.0
+      d3-time-format: 4.1.0
+      internmap: 2.0.3
+    dev: false
+
   /@visx/vendor@3.5.0:
     resolution: {integrity: sha512-yt3SEZRVmt36+APsCISSO9eSOtzQkBjt+QRxNRzcTWuzwMAaF3PHCCSe31++kkpgY9yFoF+Gfes1TBe5NlETiQ==}
     dependencies:

From 2ecd966f233fd3027b9638f037a28cfe4707b042 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Tue, 3 Dec 2024 14:28:54 -0500
Subject: [PATCH 30/36] Prevent use of log scale with broken-down STR data

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx |  2 +-
 .../ShortTandemRepeatColorBySelect.tsx        |  2 +-
 .../ShortTandemRepeatPage.tsx                 | 21 +++++++++++++++----
 3 files changed, 19 insertions(+), 6 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 6155fe29d..08748f792 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -34,7 +34,7 @@ type Props = {
   setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
   setSelectedPopulation: Dispatch<SetStateAction<PopulationId | ''>>
   setSelectedSex: Dispatch<SetStateAction<Sex | ''>>
-  setSelectedColorBy: Dispatch<SetStateAction<ColorBy | ''>>
+  setSelectedColorBy: (newColorBy: ColorBy | '') => void
 }
 
 const ShortTandemRepeatAdjacentRepeatSection = ({
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
index cbc73bccf..fe633bd2a 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -11,7 +11,7 @@ const Label = styled.label`
 type Props = {
   id: string
   selectedColorBy: ColorBy | ''
-  setSelectedColorBy: Dispatch<SetStateAction<ColorBy | ''>>
+  setSelectedColorBy: (newColorBy: ColorBy | '') => void
   setSelectedScaleType: Dispatch<SetStateAction<ScaleType>>
 }
 
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 1e6f20fba..944c5e099 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -1,4 +1,4 @@
-import React, { useState } from 'react'
+import React, { SetStateAction, useState, Dispatch } from 'react'
 import styled from 'styled-components'
 
 import { Badge, Button, ExternalLink, List, ListItem, Modal, Select } from '@gnomad/ui'
@@ -163,6 +163,11 @@ type ShortTandemRepeatPageProps = {
 
 export type ScaleType = 'linear' | 'linear-truncated' | 'log'
 
+// Stacked bar plots only make sense when the y scale factor stays constant
+// throughout, so log scale is only allowed when there's only one bar per
+// column, that is, when not breaking down the data into subsets.
+const logScaleAllowed = (colorBy: ColorBy | '') => colorBy === ''
+
 const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepeatPageProps) => {
   const { allele_size_distribution } = shortTandemRepeat
 
@@ -182,13 +187,21 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
 
   const [selectedPopulation, setSelectedPopulation] = useState<PopulationId | ''>('')
   const [selectedSex, setSelectedSex] = useState<Sex | ''>('')
-  const [selectedColorBy, setSelectedColorBy] = useState<ColorBy | ''>('')
+  const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
+  const [selectedColorBy, rawSetSelectedColorBy] = useState<ColorBy | ''>('')
+
+  const setSelectedColorBy = (newColorBy: ColorBy | '') => {
+    if (selectedScaleType === 'log' && !logScaleAllowed(newColorBy)) {
+      setSelectedScaleType('linear')
+    }
+    rawSetSelectedColorBy(newColorBy)
+  }
+
   const [selectedAlleleSizeRepeatUnit, setSelectedAlleleSizeRepeatUnit] =
     useState<string>(defaultAlleleSizeRepunit)
   const [selectedGenotypeDistributionRepeatUnits, setSelectedGenotypeDistributionRepeatUnits] =
     useState<string[] | ''>(defaultGenotypeDistributionRepunits)
   const [selectedDisease, setSelectedDisease] = useState<string>(defaultDisease)
-  const [selectedScaleType, setSelectedScaleType] = useState<ScaleType>('linear')
   const [showAdjacentRepeats, setShowAdjacentRepeats] = useState<boolean>(false)
 
   const populations = [
@@ -432,7 +445,7 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
             >
               <option value="linear">Linear</option>
               <option value="linear-truncated">Linear: Truncated</option>
-              <option value="log">Log</option>
+              {logScaleAllowed(selectedColorBy) && <option value="log">Log</option>}
             </Select>
           </label>
         </ControlSection>

From 1df6ead968ff21a29ae87f34e24bcf42c65466d6 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Tue, 3 Dec 2024 15:43:48 -0500
Subject: [PATCH 31/36] Add legend to allele size plot

---
 browser/package.json                          |  1 +
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 56 +++++++++++++++++--
 .../ShortTandemRepeatPage.tsx                 |  9 ++-
 pnpm-lock.yaml                                | 16 ++++++
 4 files changed, 77 insertions(+), 5 deletions(-)

diff --git a/browser/package.json b/browser/package.json
index 82145bc26..adbd20a93 100644
--- a/browser/package.json
+++ b/browser/package.json
@@ -23,6 +23,7 @@
     "@gnomad/ui": "2.0.0",
     "@hot-loader/react-dom": "^17.0.0",
     "@visx/axis": "^3.0.0",
+    "@visx/legend": "^3.12.0",
     "@visx/scale": "^3.12.0",
     "@visx/shape": "^3.12.0",
     "core-js": "3.5.0",
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index e86f0c1be..d323794a5 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -1,11 +1,12 @@
 import { max } from 'd3-array'
-import { scaleBand, scaleLinear, scaleLog } from 'd3-scale'
+import { scaleBand, scaleLinear, scaleLog, scaleOrdinal, scaleThreshold } from 'd3-scale'
 import React, { useMemo } from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
 import { BarStack } from '@visx/shape'
 import { AnyD3Scale } from '@visx/scale'
+import { LegendOrdinal, LegendThreshold } from '@visx/legend'
 
 import { TooltipAnchor } from '@gnomad/ui'
 import {
@@ -17,7 +18,7 @@ import {
   ScaleType,
   Sex,
 } from './ShortTandemRepeatPage'
-import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { GNOMAD_POPULATION_NAMES, PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -36,13 +37,13 @@ const TooltipTrigger = styled.rect`
 `
 
 const defaultColor = '#73ab3d'
-const colorMap: Record<string, Record<string, string>> = {
+const colorMap: Record<ColorBy | '', Record<string, string>> = {
   '': {
     '': defaultColor,
   },
   quality_description: {
     low: '#d73027',
-    'low-medium': '#fc8d59',
+    'medium-low': '#fc8d59',
     medium: '#fee08b',
     'medium-high': '#d9ef8b',
     high: '#1a9850',
@@ -60,6 +61,7 @@ const colorMap: Record<string, Record<string, string>> = {
     '0.8': '#66ff99',
     '0.9': '#33ffcc',
     '1.0': '#00ff00',
+    '': defaultColor,
   },
   sex: {
     XX: '#F7C3CC',
@@ -77,8 +79,41 @@ const colorMap: Record<string, Record<string, string>> = {
     oth: '#ABB8B9',
     sas: '#FE9A10',
   },
+} as const
+
+const qualityDescriptionLabels: Record<GenotypeQuality, string> = {
+  low: 'Low',
+  'medium-low': 'Medium-low',
+  medium: 'Medium',
+  'medium-high': 'Medium-high',
+  high: 'High',
+  'not-reviewed': 'Not reviewed',
+}
+
+const qScoreLabels: Record<QScoreBin, string> = {
+  '0.0': '0',
+  '0.1': '0 < q ≤ 0.1',
+  '0.2': '0.1 < q ≤ 0.2',
+  '0.3': '0.2 < q ≤ 0.3',
+  '0.4': '0.3 < q ≤ 0.4',
+  '0.5': '0.4 < q ≤ 0.5',
+  '0.6': '0.5 < q ≤ 0.6',
+  '0.7': '0.6 < q ≤ 0.7',
+  '0.8': '0.7 < q ≤ 0.8',
+  '0.9': '0.8 < q ≤ 0.9',
+  '1.0': '0.9 < q ≤ 1.0',
+  '': 'Not reviewed',
+}
+
+const fixedLegendLabels: Partial<Record<ColorBy, Record<string, string>>> = {
+  quality_description: qualityDescriptionLabels,
+  q_score: qScoreLabels,
+  population: GNOMAD_POPULATION_NAMES,
 }
 
+const legendLabels = (colorBy: ColorBy, keys: string[]) =>
+  keys.map((key) => fixedLegendLabels[colorBy]?.[key] || key)
+
 const colorForValue = (colorBy: ColorBy | '', value: string) =>
   colorMap[colorBy]?.[value] || defaultColor
 
@@ -118,6 +153,18 @@ type Bin = Partial<Record<ColorByValue, number>> & {
   fullFrequency: number
 }
 
+const LegendFromColorBy = ({ colorBy }: { colorBy: ColorBy | '' }) => {
+  if (colorBy === '') {
+    return null
+  }
+
+  const keys = Object.keys(colorMap[colorBy])
+  const labels = legendLabels(colorBy, keys)
+  const colors = keys.map((key) => colorMap[colorBy][key])
+  const scale = scaleOrdinal().domain(labels).range(colors)
+  return <LegendOrdinal scale={scale} direction="row" />
+}
+
 const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
   ({
     maxRepeats,
@@ -219,6 +266,7 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
 
     return (
       <GraphWrapper>
+        <LegendFromColorBy colorBy={colorBy} />
         <svg height={binSize === 1 ? height - 20 : height} width={width}>
           <AxisBottom
             label="Repeats"
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 944c5e099..ec17bc540 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -38,7 +38,13 @@ type ShortTandemRepeatReferenceRegion = {
   stop: number
 }
 
-export type GenotypeQuality = 'low' | 'medium-low' | 'medium' | 'medium-high' | 'high'
+export type GenotypeQuality =
+  | 'low'
+  | 'medium-low'
+  | 'medium'
+  | 'medium-high'
+  | 'high'
+  | 'not-reviewed'
 export type QScoreBin =
   | '0.0'
   | '0.1'
@@ -51,6 +57,7 @@ export type QScoreBin =
   | '0.8'
   | '0.9'
   | '1.0'
+  | ''
 export type ColorByValue = GenotypeQuality | QScoreBin | Sex | PopulationId | ''
 
 export type AlleleSizeDistributionItem = {
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index c9262ad41..fc87b9010 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -183,6 +183,9 @@ importers:
       '@visx/axis':
         specifier: ^3.0.0
         version: 3.5.0(react@17.0.2)
+      '@visx/legend':
+        specifier: ^3.12.0
+        version: 3.12.0(react@17.0.2)
       '@visx/scale':
         specifier: ^3.12.0
         version: 3.12.0
@@ -4540,6 +4543,19 @@ packages:
       react: 17.0.2
     dev: false
 
+  /@visx/legend@3.12.0(react@17.0.2):
+    resolution: {integrity: sha512-Tr6hdauEDXRXVNeNgIQ9JtCCrxn8Fbr8UCVlO9XsSxenk2hBC/2PIY5QPzpnKFEEEuH/C8vhj8T0JfFZV+D9zQ==}
+    peerDependencies:
+      react: ^16.3.0-0 || ^17.0.0-0 || ^18.0.0-0
+    dependencies:
+      '@types/react': 17.0.74
+      '@visx/group': 3.12.0(react@17.0.2)
+      '@visx/scale': 3.12.0
+      classnames: 2.3.2
+      prop-types: 15.8.1
+      react: 17.0.2
+    dev: false
+
   /@visx/point@3.3.0:
     resolution: {integrity: sha512-03eBBIJarkmX79WbeEGTUZwmS5/MUuabbiM9KfkGS9pETBTWkp1DZtEHZdp5z34x5TDQVLSi0rk1Plg3/8RtDg==}
     dev: false

From 165fb0be2050b6b77bbf62b979a6291492334078 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Fri, 6 Dec 2024 14:43:58 -0500
Subject: [PATCH 32/36] WIP: per-bar tooltips for STR allele size plot

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 42 +++++++++++++++----
 1 file changed, 34 insertions(+), 8 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index d323794a5..4bdd77900 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -1,12 +1,12 @@
 import { max } from 'd3-array'
-import { scaleBand, scaleLinear, scaleLog, scaleOrdinal, scaleThreshold } from 'd3-scale'
+import { scaleBand, scaleLinear, scaleLog, scaleOrdinal } from 'd3-scale'
 import React, { useMemo } from 'react'
 import { withSize } from 'react-sizeme'
 import styled from 'styled-components'
 import { AxisBottom, AxisLeft } from '@visx/axis'
-import { BarStack } from '@visx/shape'
+import { BarStack, Bar } from '@visx/shape'
 import { AnyD3Scale } from '@visx/scale'
-import { LegendOrdinal, LegendThreshold } from '@visx/legend'
+import { LegendOrdinal } from '@visx/legend'
 
 import { TooltipAnchor } from '@gnomad/ui'
 import {
@@ -16,9 +16,8 @@ import {
   GenotypeQuality,
   QScoreBin,
   ScaleType,
-  Sex,
 } from './ShortTandemRepeatPage'
-import { GNOMAD_POPULATION_NAMES, PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -28,11 +27,11 @@ const GraphWrapper = styled.div`
   height: 100%; /* stylelint-disable-line unit-whitelist */
 `
 
-const TooltipTrigger = styled.rect`
+const BarWithHoverEffect = styled(Bar)`
   pointer-events: visible;
 
   &:hover {
-    fill: rgba(0, 0, 0, 0.05);
+    fill-opacity: 0.7;
   }
 `
 
@@ -165,6 +164,13 @@ const LegendFromColorBy = ({ colorBy }: { colorBy: ColorBy | '' }) => {
   return <LegendOrdinal scale={scale} direction="row" />
 }
 
+const tooltipContent = (data: Bin, key: ColorByValue | ''): string => {
+  const repeatText = data.label === '1' ? '1 repeat' : data.label.toString() + ' repeats'
+  const alleles = data[key] || 0
+  const alleleText = alleles === 1 ? '1 allele' : alleles.toString() + ' alleles'
+  return `${repeatText}: ${alleleText}`
+}
+
 const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
   ({
     maxRepeats,
@@ -347,7 +353,27 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
               x={(bin) => bin.index}
               y0={(point) => point[0] || 0}
               y1={(point) => point[1] || 0}
-            />{' '}
+            >
+              {(stacks) =>
+                stacks.map((stack) =>
+                  stack.bars.map((bar) => {
+                    const tooltip = tooltipContent(bar.bar.data, bar.key as ColorByValue | '')
+                    return (
+                      <React.Fragment key={'bar-stack-' + bar.x + '-' + bar.y}>
+                        <TooltipAnchor
+                          // @ts-expect-error
+                          tooltip={tooltip}
+                        >
+                          <g>
+                            <BarWithHoverEffect {...bar} stroke="black" fill={bar.color} />
+                          </g>
+                        </TooltipAnchor>
+                      </React.Fragment>
+                    )
+                  })
+                )
+              }
+            </BarStack>
           </g>
 
           <g transform={`translate(${margin.left}, 0)`}>

From 0d03e6475749a3ef21de176b844e26eb02eeacfa Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 9 Dec 2024 14:16:56 -0500
Subject: [PATCH 33/36] fixup: stop hard-coding API host in BaseQuery fetch

---
 browser/src/Query.tsx | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/browser/src/Query.tsx b/browser/src/Query.tsx
index d4b053a35..dfe01452d 100644
--- a/browser/src/Query.tsx
+++ b/browser/src/Query.tsx
@@ -96,7 +96,7 @@ export class BaseQuery extends Component<BaseQueryProps, BaseQueryState> {
     }
 
     this.currentRequest = cancelable(
-      fetch(`http://34.102.236.129${url}`, {
+      fetch(url, {
         body: JSON.stringify({
           operationName,
           query,

From dd7aeff148d64f3a732d73d18a247e6bf34195f7 Mon Sep 17 00:00:00 2001
From: Phil Darnowsky <pdarnows@broadinstitute.org>
Date: Mon, 9 Dec 2024 17:16:24 -0500
Subject: [PATCH 34/36] fixup: use fixed key order for allele size plot legend

---
 ...ShortTandemRepeatAdjacentRepeatSection.tsx |  3 +-
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 66 +++++++++++++++----
 .../ShortTandemRepeatColorBySelect.tsx        |  2 +-
 ...emRepeatGenotypeDistributionBinDetails.tsx |  4 +-
 .../ShortTandemRepeatPage.tsx                 | 43 +++---------
 .../ShortTandemRepeatPopulationOptions.tsx    |  2 +-
 .../shortTandemRepeatHelpers.ts               | 12 ++--
 .../src/__factories__/ShortTandemRepeat.ts    |  2 +-
 8 files changed, 75 insertions(+), 59 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index 08748f792..e4bc13f98 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -5,7 +5,8 @@ import { Modal, Select } from '@gnomad/ui'
 import ControlSection from '../VariantPage/ControlSection'
 
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
-import { ShortTandemRepeatAdjacentRepeat, ScaleType, Sex, ColorBy } from './ShortTandemRepeatPage'
+import { ShortTandemRepeatAdjacentRepeat } from './ShortTandemRepeatPage'
+import { ScaleType, Sex, ColorBy } from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionPlot from './ShortTandemRepeatGenotypeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionBinDetails from './ShortTandemRepeatGenotypeDistributionBinDetails'
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 4bdd77900..346ca39f8 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -9,15 +9,8 @@ import { AnyD3Scale } from '@visx/scale'
 import { LegendOrdinal } from '@visx/legend'
 
 import { TooltipAnchor } from '@gnomad/ui'
-import {
-  AlleleSizeDistributionItem,
-  ColorBy,
-  ColorByValue,
-  GenotypeQuality,
-  QScoreBin,
-  ScaleType,
-} from './ShortTandemRepeatPage'
 import { GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
+import { PopulationId } from '@gnomad/dataset-metadata/gnomadPopulations'
 
 // The 100% width/height container is necessary the component
 // to size to fit its container vs staying at its initial size.
@@ -35,6 +28,46 @@ const BarWithHoverEffect = styled(Bar)`
   }
 `
 
+export type ScaleType = 'linear' | 'linear-truncated' | 'log'
+
+export const genotypeQualityKeys = [
+  'low',
+  'medium-low',
+  'medium',
+  'medium-high',
+  'high',
+  'not-reviewed',
+] as const
+
+export type GenotypeQuality = (typeof genotypeQualityKeys)[number]
+
+export const qScoreKeys = [
+  '0.0',
+  '0.1',
+  '0.2',
+  '0.3',
+  '0.4',
+  '0.5',
+  '0.6',
+  '0.7',
+  '0.8',
+  '0.9',
+  '1',
+] as const
+
+export type QScoreBin = (typeof qScoreKeys)[number]
+export type ColorByValue = GenotypeQuality | QScoreBin | Sex | PopulationId | ''
+
+export type AlleleSizeDistributionItem = {
+  repunit_count: number
+  frequency: number
+  colorByValue: ColorByValue
+}
+
+export type Sex = 'XX' | 'XY'
+
+export type ColorBy = 'quality_description' | 'q_score' | 'population' | 'sex'
+
 const defaultColor = '#73ab3d'
 const colorMap: Record<ColorBy | '', Record<string, string>> = {
   '': {
@@ -59,8 +92,7 @@ const colorMap: Record<ColorBy | '', Record<string, string>> = {
     '0.7': '#99ff66',
     '0.8': '#66ff99',
     '0.9': '#33ffcc',
-    '1.0': '#00ff00',
-    '': defaultColor,
+    '1': '#00ff00',
   },
   sex: {
     XX: '#F7C3CC',
@@ -100,8 +132,7 @@ const qScoreLabels: Record<QScoreBin, string> = {
   '0.7': '0.6 < q ≤ 0.7',
   '0.8': '0.7 < q ≤ 0.8',
   '0.9': '0.8 < q ≤ 0.9',
-  '1.0': '0.9 < q ≤ 1.0',
-  '': 'Not reviewed',
+  '1': '0.9 < q ≤ 1',
 }
 
 const fixedLegendLabels: Partial<Record<ColorBy, Record<string, string>>> = {
@@ -152,13 +183,20 @@ type Bin = Partial<Record<ColorByValue, number>> & {
   fullFrequency: number
 }
 
+const legendKeys: Record<ColorBy, string[]> = {
+  quality_description: [...genotypeQualityKeys],
+  q_score: [...qScoreKeys],
+  sex: ['XX', 'XY'],
+  population: ['nfe', 'afr', 'fin', 'amr', 'ami', 'asj', 'eas', 'mid', 'oth', 'sas'],
+}
+
 const LegendFromColorBy = ({ colorBy }: { colorBy: ColorBy | '' }) => {
   if (colorBy === '') {
     return null
   }
 
-  const keys = Object.keys(colorMap[colorBy])
-  const labels = legendLabels(colorBy, keys)
+  const keys = legendKeys[colorBy]
+  const labels = legendLabels(colorBy, [...keys])
   const colors = keys.map((key) => colorMap[colorBy][key])
   const scale = scaleOrdinal().domain(labels).range(colors)
   return <LegendOrdinal scale={scale} direction="row" />
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
index fe633bd2a..053e4ef27 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -2,7 +2,7 @@ import React, { Dispatch, SetStateAction } from 'react'
 import styled from 'styled-components'
 
 import { Select } from '@gnomad/ui'
-import { ColorBy, ScaleType } from './ShortTandemRepeatPage'
+import { ColorBy, ScaleType } from './ShortTandemRepeatAlleleSizeDistributionPlot'
 
 const Label = styled.label`
   padding-right: 1em;
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
index 53d74d32d..a7a05a006 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatGenotypeDistributionBinDetails.tsx
@@ -5,11 +5,13 @@ import { List, ListItem } from '@gnomad/ui'
 import {
   ShortTandemRepeat,
   ShortTandemRepeatAdjacentRepeat,
-  Sex,
   GenotypeDistributionItem,
 } from './ShortTandemRepeatPage'
+
 import { getSelectedGenotypeDistribution } from './shortTandemRepeatHelpers'
 
+import { Sex } from './ShortTandemRepeatAlleleSizeDistributionPlot'
+
 type Props = {
   shortTandemRepeatOrAdjacentRepeat: ShortTandemRepeat | ShortTandemRepeatAdjacentRepeat
   selectedPopulation: string | ''
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index ec17bc540..2fea726b1 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -14,7 +14,14 @@ import ShortTandemRepeatAssociatedDiseasesTable from './ShortTandemRepeatAssocia
 import ShortTandemRepeatAttributes from './ShortTandemRepeatAttributes'
 import ShortTandemRepeatPopulationOptions from './ShortTandemRepeatPopulationOptions'
 import ShortTandemRepeatColorBySelect from './ShortTandemRepeatColorBySelect'
-import ShortTandemRepeatAlleleSizeDistributionPlot from './ShortTandemRepeatAlleleSizeDistributionPlot'
+import ShortTandemRepeatAlleleSizeDistributionPlot, {
+  ColorBy,
+  GenotypeQuality,
+  QScoreBin,
+  Sex,
+  ScaleType,
+  AlleleSizeDistributionItem,
+} from './ShortTandemRepeatAlleleSizeDistributionPlot'
 import ShortTandemRepeatGenotypeDistributionPlot, {
   Bin as GenotypeBin,
 } from './ShortTandemRepeatGenotypeDistributionPlot'
@@ -38,38 +45,6 @@ type ShortTandemRepeatReferenceRegion = {
   stop: number
 }
 
-export type GenotypeQuality =
-  | 'low'
-  | 'medium-low'
-  | 'medium'
-  | 'medium-high'
-  | 'high'
-  | 'not-reviewed'
-export type QScoreBin =
-  | '0.0'
-  | '0.1'
-  | '0.2'
-  | '0.3'
-  | '0.4'
-  | '0.5'
-  | '0.6'
-  | '0.7'
-  | '0.8'
-  | '0.9'
-  | '1.0'
-  | ''
-export type ColorByValue = GenotypeQuality | QScoreBin | Sex | PopulationId | ''
-
-export type AlleleSizeDistributionItem = {
-  repunit_count: number
-  frequency: number
-  colorByValue: ColorByValue
-}
-
-export type Sex = 'XX' | 'XY'
-
-export type ColorBy = 'quality_description' | 'q_score' | 'population' | 'sex'
-
 export type AlleleSizeDistributionCohort = {
   ancestry_group: PopulationId
   sex: Sex
@@ -168,8 +143,6 @@ type ShortTandemRepeatPageProps = {
   shortTandemRepeat: ShortTandemRepeat
 }
 
-export type ScaleType = 'linear' | 'linear-truncated' | 'log'
-
 // Stacked bar plots only make sense when the y scale factor stays constant
 // throughout, so log scale is only allowed when there's only one bar per
 // column, that is, when not breaking down the data into subsets.
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
index 0b419fcd9..e232ad206 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPopulationOptions.tsx
@@ -5,7 +5,7 @@ import { Select } from '@gnomad/ui'
 
 import { PopulationId, GNOMAD_POPULATION_NAMES } from '@gnomad/dataset-metadata/gnomadPopulations'
 
-import { Sex } from './ShortTandemRepeatPage'
+import { Sex } from './ShortTandemRepeatAlleleSizeDistributionPlot'
 
 const Wrapper = styled.div`
   @media (max-width: 600px) {
diff --git a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
index de1da8ba4..b6dbc10a7 100644
--- a/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
+++ b/browser/src/ShortTandemRepeatPage/shortTandemRepeatHelpers.ts
@@ -1,16 +1,18 @@
 import {
-  ColorBy,
-  GenotypeQuality,
-  Sex,
   ShortTandemRepeat,
-  AlleleSizeDistributionItem,
   AlleleSizeDistributionCohort,
   GenotypeDistributionCohort,
   GenotypeDistributionItem,
   ShortTandemRepeatAdjacentRepeat,
-  ColorByValue,
 } from './ShortTandemRepeatPage'
 
+import {
+  ColorBy,
+  Sex,
+  ColorByValue,
+  AlleleSizeDistributionItem,
+} from './ShortTandemRepeatAlleleSizeDistributionPlot'
+
 type AlleleSizeDistributionParams = {
   selectedPopulation: string | ''
   selectedSex: Sex | ''
diff --git a/browser/src/__factories__/ShortTandemRepeat.ts b/browser/src/__factories__/ShortTandemRepeat.ts
index 716782eeb..522949e85 100644
--- a/browser/src/__factories__/ShortTandemRepeat.ts
+++ b/browser/src/__factories__/ShortTandemRepeat.ts
@@ -49,7 +49,7 @@ const shortTandemRepeatFactory = Factory.define<ShortTandemRepeat>(({ params, as
         short_allele_repunit: 'ACCA',
         long_allele_repunit: 'GATA',
         quality_description: 'high',
-        q_score: '1.0',
+        q_score: '1',
         distribution: [
           { short_allele_repunit_count: 8, long_allele_repunit_count: 9, frequency: 15 },
           { short_allele_repunit_count: 8, long_allele_repunit_count: 10, frequency: 19 },

From b760f0a19e6e8efd9c01eae3249c5e0b030b9c97 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Tue, 10 Dec 2024 11:20:17 -0500
Subject: [PATCH 35/36] Update Q-score legend labels and legend spacing

---
 ...TandemRepeatAlleleSizeDistributionPlot.tsx | 31 ++++++++++++-------
 1 file changed, 19 insertions(+), 12 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index 346ca39f8..f95ee1067 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -122,17 +122,17 @@ const qualityDescriptionLabels: Record<GenotypeQuality, string> = {
 }
 
 const qScoreLabels: Record<QScoreBin, string> = {
-  '0.0': '0',
-  '0.1': '0 < q ≤ 0.1',
-  '0.2': '0.1 < q ≤ 0.2',
-  '0.3': '0.2 < q ≤ 0.3',
-  '0.4': '0.3 < q ≤ 0.4',
-  '0.5': '0.4 < q ≤ 0.5',
-  '0.6': '0.5 < q ≤ 0.6',
-  '0.7': '0.6 < q ≤ 0.7',
-  '0.8': '0.7 < q ≤ 0.8',
-  '0.9': '0.8 < q ≤ 0.9',
-  '1': '0.9 < q ≤ 1',
+  '0.0': '0 to 0.05',
+  '0.1': '0.05 to 0.15',
+  '0.2': '0.15 to 0.25',
+  '0.3': '0.25 to 0.35',
+  '0.4': '0.35 to 0.45',
+  '0.5': '0.45 to 0.55',
+  '0.6': '0.55 to 0.65',
+  '0.7': '0.65 to 0.75',
+  '0.8': '0.75 to 0.85',
+  '0.9': '0.85 to 0.95',
+  '1': '0.95 to 1',
 }
 
 const fixedLegendLabels: Partial<Record<ColorBy, Record<string, string>>> = {
@@ -199,7 +199,14 @@ const LegendFromColorBy = ({ colorBy }: { colorBy: ColorBy | '' }) => {
   const labels = legendLabels(colorBy, [...keys])
   const colors = keys.map((key) => colorMap[colorBy][key])
   const scale = scaleOrdinal().domain(labels).range(colors)
-  return <LegendOrdinal scale={scale} direction="row" />
+  return (
+    <LegendOrdinal
+      scale={scale}
+      shapeMargin="0 7px 20px 0px"
+      labelMargin="0 10px 20px 0px"
+      direction="row"
+    />
+  )
 }
 
 const tooltipContent = (data: Bin, key: ColorByValue | ''): string => {

From 704726f7b20f0249696028a470e6675e0f37a016 Mon Sep 17 00:00:00 2001
From: bw2 <ben.weisburd@gmail.com>
Date: Tue, 10 Dec 2024 11:33:03 -0500
Subject: [PATCH 36/36] Add truncation options (50, 200, 1000) to y-scale drop-down

---
 .../ShortTandemRepeatAdjacentRepeatSection.tsx      |  4 +++-
 .../ShortTandemRepeatAlleleSizeDistributionPlot.tsx | 13 +++++++++++--
 .../ShortTandemRepeatColorBySelect.tsx              |  2 +-
 .../ShortTandemRepeatPage/ShortTandemRepeatPage.tsx |  4 +++-
 4 files changed, 18 insertions(+), 5 deletions(-)

diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
index e4bc13f98..06c073bcf 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAdjacentRepeatSection.tsx
@@ -122,8 +122,10 @@ const ShortTandemRepeatAdjacentRepeatSection = ({
             }}
           >
             <option value="linear">Linear</option>
-            <option value="linear-truncated">Linear: Truncated</option>
             <option value="log">Log</option>
+            <option value="linear-truncated-50">Linear: Truncated at 50</option>
+            <option value="linear-truncated-200">Linear: Truncated at 200</option>
+            <option value="linear-truncated-1000">Linear: Truncated at 1000</option>
           </Select>
         </label>
       </ControlSection>
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
index f95ee1067..e7c45c7a5 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatAlleleSizeDistributionPlot.tsx
@@ -28,7 +28,12 @@ const BarWithHoverEffect = styled(Bar)`
   }
 `
 
-export type ScaleType = 'linear' | 'linear-truncated' | 'log'
+export type ScaleType =
+  | 'linear'
+  | 'linear-truncated-50'
+  | 'linear-truncated-200'
+  | 'linear-truncated-1000'
+  | 'log'
 
 export const genotypeQualityKeys = [
   'low',
@@ -290,8 +295,12 @@ const ShortTandemRepeatAlleleSizeDistributionPlot = withSize()(
         .domain([1, 10 ** maxLog])
         .range([plotHeight, 0])
         .clamp(true)
-    } else if (scaleType === 'linear-truncated') {
+    } else if (scaleType === 'linear-truncated-50') {
       yScale = scaleLinear().domain([0, 50]).range([plotHeight, 0]).clamp(true)
+    } else if (scaleType === 'linear-truncated-200') {
+      yScale = scaleLinear().domain([0, 200]).range([plotHeight, 0]).clamp(true)
+    } else if (scaleType === 'linear-truncated-1000') {
+      yScale = scaleLinear().domain([0, 1000]).range([plotHeight, 0]).clamp(true)
     } else {
       yScale = scaleLinear()
         .domain([0, max(data, (d) => d.fullFrequency) || 1])
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
index 053e4ef27..6321188a0 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatColorBySelect.tsx
@@ -30,7 +30,7 @@ const ShortTandemRepeatColorBySelect = ({
         onChange={(e: { target: { value: ColorBy | '' } }) => {
           setSelectedColorBy(e.target.value)
           if (e.target.value === 'quality_description') {
-            setSelectedScaleType('linear-truncated')
+            setSelectedScaleType('linear-truncated-50')
           }
         }}
       >
diff --git a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
index 2fea726b1..3d2c1f6ec 100644
--- a/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
+++ b/browser/src/ShortTandemRepeatPage/ShortTandemRepeatPage.tsx
@@ -424,8 +424,10 @@ const ShortTandemRepeatPage = ({ datasetId, shortTandemRepeat }: ShortTandemRepe
               }}
             >
               <option value="linear">Linear</option>
-              <option value="linear-truncated">Linear: Truncated</option>
               {logScaleAllowed(selectedColorBy) && <option value="log">Log</option>}
+              <option value="linear-truncated-50">Linear: Truncated at 50</option>
+              <option value="linear-truncated-200">Linear: Truncated at 200</option>
+              <option value="linear-truncated-1000">Linear: Truncated at 1000</option>
             </Select>
           </label>
         </ControlSection>