Skip to content

Commit f8c1473

Browse files
committed
possibly the last of the matches
Signed-off-by: John Seekins <john@robot-house.us>
1 parent e8c287d commit f8c1473

2 files changed

Lines changed: 23 additions & 1 deletion

File tree

ice_scrapers/utils.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -166,6 +166,7 @@ def repair_name(name: str, locality: str) -> Tuple[str, bool]:
166166
"replace": "WASHINGTON COUNTY JAIL",
167167
"locality": "HURRICANE",
168168
},
169+
{"match": "ETOWAH COUNTY JAIL (ALABAMA)", "replace": "ETOWAH COUNTY JAIL", "locality": "GADSDEN"},
169170
]
170171
cleaned = False
171172
for m in matches:

ice_scrapers/vera_data.py

Lines changed: 22 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -157,6 +157,27 @@ def _vera_name_fixes(name: str, city: str) -> Tuple[str, bool]:
157157
"replace": "Chittenden Regional Correctional Facility",
158158
"city": "South Burlington",
159159
},
160+
{
161+
"match": "NW Regional Corrections Center",
162+
"replace": "Northwest Regional Corrections Center",
163+
"city": "Crookston",
164+
},
165+
{
166+
"match": "Lasalle ICE Processing Center",
167+
"replace": "Central Louisiana ICE Processing Center (CLIPC)",
168+
"city": "Jena",
169+
},
170+
{
171+
"match": "La Salle Co Regional Det. Center",
172+
"replace": "La Salle County Regional Detention Center",
173+
"city": "Encinal",
174+
},
175+
{
176+
"match": "Hancock Co Pub Sfty Cplx",
177+
"replace": "Hancock County Public Safety Complex",
178+
"city": "Bay St. Louis",
179+
},
180+
{"match": "Brooks County Jail (Contract)", "replace": "Brooks County Jail", "city": "Falfurrias"},
160181
]
161182
fixed = False
162183
for m in matches:
@@ -196,7 +217,7 @@ def collect_vera_facility_data(facilities_data: dict, keep_sheet: bool = True, f
196217
df = polars.read_csv(has_header=True, raise_if_empty=True, source=filename, use_pyarrow=True)
197218
if df.is_empty():
198219
raise ValueError("Empty CSV loaded somehow! %s", df)
199-
# first step to removing duplicates is easy
220+
# first step to removing duplicates is easy, but unlikely to actually filter anything
200221
df = df.unique()
201222
logger.debug("Extracted data: %s", df)
202223
"""

0 commit comments

Comments (0)