freelawproject · albertisfu · Feb 7, 2025 · Jan 27, 2025 · Jan 31, 2025 · Jan 31, 2025
diff --git a/cl/corpus_importer/utils.py b/cl/corpus_importer/utils.py
@@ -107,6 +107,23 @@ async def mark_ia_upload_needed(d: Docket, save_docket: bool) -> None:
         await d.asave()
 
 
+def is_bankruptcy_court(court_id: str) -> bool:
+    """Tell whether ``court_id`` identifies a bankruptcy court.
+
+    Narrows the ``Court.federal_courts.bankruptcy_pacer_courts()`` queryset
+    to the given primary key and checks whether any row remains.
+
+    Args:
+        court_id: Primary key of the court to look up.
+
+    Returns:
+        True if that queryset contains the court, False otherwise.
+    """
+    pacer_bankr_courts = Court.federal_courts.bankruptcy_pacer_courts()
+    is_listed: bool = pacer_bankr_courts.filter(pk=court_id).exists()
+    return is_listed
+
+
 def is_appellate_court(court_id: str) -> bool:
     """Checks if the given court_id belongs to an appellate court.
 

diff --git a/cl/lib/search_index_utils.py b/cl/lib/search_index_utils.py
@@ -1,3 +1,4 @@
+import re
 from datetime import date
 
 from cl.lib.date_time import midnight_pt
@@ -40,6 +41,8 @@ def __init__(self, message):
     list(range(0, 10)) + list(range(11, 13)) + list(range(14, 32))
 )
 
+VALID_CASE_NAME_SEPARATORS = [" v ", " v. ", " vs. ", " vs "]
+
 
 def get_parties_from_case_name(case_name: str) -> list[str]:
     """Extracts the parties from case_name by splitting on common case_name
@@ -49,14 +52,46 @@ def get_parties_from_case_name(case_name: str) -> list[str]:
     :return: A list of parties. If no valid separator is found, returns an
     empty list.
     """
-
-    valid_case_name_separators = [
-        " v ",
-        " v. ",
-        " vs. ",
-        " vs ",
-    ]
-    for separator in valid_case_name_separators:
+    for separator in VALID_CASE_NAME_SEPARATORS:
         if separator in case_name:
             return case_name.split(separator, 1)
     return []
+
+
+def get_parties_from_case_name_bankr(case_name: str) -> list[str]:
+    """Extracts the parties involved in a bankruptcy case from the case name.
+
+    The case name is first cleaned of a trailing parenthetical, trailing
+    HTML and any "-BELOW"/"-ABOVE" suffix, and the cleaned name is then split
+    once on the first recognized separator it contains. Besides the standard
+    separators, " and " is also accepted (e.g. "A and B").
+
+    If the case name begins with "in re" or "in the matter of", an empty list
+    is returned, as these typically don't contain party information in the
+    standard format.
+
+    :param case_name: The bankruptcy case name string.
+    :return: A list of strings, where each string represents a party involved
+    in the case. If no recognized separator is found, the function returns
+    a list containing the cleaned case name as a single element.
+    """
+    # Handle cases beginning with "in re" or "in the matter of".
+    # These usually don't contain party information in the expected format.
+    if re.match(r"^(in re|in the matter of)", case_name, re.IGNORECASE):
+        return []
+
+    # Removes text enclosed in parentheses at the end of the string.
+    cleaned_case_name = re.sub(r"\s*\([^)]*\)$", "", case_name)
+
+    # Removes any HTML at the end of the string.
+    cleaned_case_name = re.sub(r"\s*<.*$", "", cleaned_case_name)
+
+    # Removes text following "-BELOW" or "-ABOVE" at the end of the string.
+    cleaned_case_name = re.sub(r"\s*(-BELOW|-ABOVE).*$", "", cleaned_case_name)
+
+    # Look for separators in the cleaned name, not the raw one: a separator
+    # that only occurs in the stripped text must not stop the search early.
+    for separator in [*VALID_CASE_NAME_SEPARATORS, " and "]:
+        if separator in cleaned_case_name:
+            return cleaned_case_name.split(separator, 1)
+    return [cleaned_case_name]
diff --git a/cl/lib/tests.py b/cl/lib/tests.py
@@ -39,6 +39,7 @@
     get_redis_interface,
     release_redis_lock,
 )
+from cl.lib.search_index_utils import get_parties_from_case_name_bankr
 from cl.lib.string_utils import normalize_dashes, trunc
 from cl.lib.utils import (
     check_for_proximity_tokens,
@@ -1203,6 +1204,117 @@ def test_check_and_sanitize_queries_bad_syntax(self) -> None:
             )
             self.assertEqual(output, test["sanitized"])
 
+    def test_can_get_parties_from_bankruptcy_case_name(self) -> None:
+        """Can we extract the parties from bankruptcy case names?"""
+
+        class PartiesNameTestType(TypedDict):
+            case_name: str
+            output: list[str]
+
+        tests: list[PartiesNameTestType] = [
+            {
+                "case_name": "Mendelsohn. Singh",
+                "output": ["Mendelsohn. Singh"],
+            },
+            {
+                "case_name": "Cadle Co. v Matos",
+                "output": ["Cadle Co.", "Matos"],
+            },
+            # The standard separators take precedence over " and ".
+            {
+                "case_name": "Saucedo and Green v. Carlson",
+                "output": ["Saucedo and Green", "Carlson"],
+            },
+            {
+                "case_name": "Cadle Co. v. Matos",
+                "output": ["Cadle Co.", "Matos"],
+            },
+            {
+                "case_name": "Cadle Co. vs Matos",
+                "output": ["Cadle Co.", "Matos"],
+            },
+            {
+                "case_name": "Cadle Co. vs. Matos",
+                "output": ["Cadle Co.", "Matos"],
+            },
+            {
+                "case_name": "Paul Thomas Presbury, Jr. and Lisa Rae Presbury",
+                "output": ["Paul Thomas Presbury, Jr.", "Lisa Rae Presbury"],
+            },
+            {
+                "case_name": "Ma Margarita Bernal Sosa -ABOVE MED",
+                "output": ["Ma Margarita Bernal Sosa"],
+            },
+            {
+                "case_name": "Jennifer Renee' Abbott and Quentin Andrew Abbott -ABOVE MED",
+                "output": ["Jennifer Renee' Abbott", "Quentin Andrew Abbott"],
+            },
+            {
+                "case_name": "Aiesha Renee -BELOW MED",
+                "output": ["Aiesha Renee"],
+            },
+            {
+                "case_name": "Justin Kaiser and Belinda Kaiser -BELOW MED",
+                "output": ["Justin Kaiser", "Belinda Kaiser"],
+            },
+            {
+                "case_name": "Cosmorex Ltd. (in Liquidation)",
+                "output": ["Cosmorex Ltd."],
+            },
+            {
+                "case_name": "Cowen & Co. v. Zagar (In re Zagar)",
+                "output": ["Cowen & Co.", "Zagar"],
+            },
+            {
+                "case_name": 'Advantage LLC <b><font color="red">Jointly Administered under 23-90886.</font></b>',
+                "output": ["Advantage LLC"],
+            },
+            {
+                "case_name": 'Sather v. Carlson<b><font color="red">DO NOT DOCKET. CASE TRANSFERRED OUT.</font></b>',
+                "output": ["Sather", "Carlson"],
+            },
+            {
+                "case_name": 'Saucedo and Green Dream International, LLC <b> <font color="red"> Case Consolidated under 23-03142 </font> </b>',
+                "output": ["Saucedo", "Green Dream International, LLC"],
+            },
+            {
+                "case_name": "In re: Matter of Nicholas M. Wajda",
+                "output": [],
+            },
+            {
+                "case_name": "In re Matter of Proof of Claim Replacement Filings",
+                "output": [],
+            },
+            {
+                "case_name": "In re T.H.",
+                "output": [],
+            },
+            {
+                "case_name": "In Re: Dempsey Clay Ward",
+                "output": [],
+            },
+            {
+                "case_name": "In re: Receivership of Horses and Equipment v. Gabriel",
+                "output": [],
+            },
+            {
+                "case_name": "In Re: Appearances of Attorney James G. ORourke in Pending Bankruptcy Cases",
+                "output": [],
+            },
+            {
+                "case_name": "In the matter of Attorney Rodney D. Shepherd",
+                "output": [],
+            },
+        ]
+        for test in tests:
+            with self.subTest(
+                input=test["case_name"], msg="get parties names from case name"
+            ):
+                parties: list[str] = get_parties_from_case_name_bankr(
+                    test["case_name"]
+                )
+                self.assertEqual(parties, test["output"])
+
 
 class TestRedisUtils(SimpleTestCase):
     """Test Redis utils functions."""

diff --git a/cl/search/documents.py b/cl/search/documents.py
@@ -8,14 +8,19 @@
 
 from cl.alerts.models import Alert
 from cl.audio.models import Audio
+from cl.corpus_importer.utils import is_bankruptcy_court
 from cl.custom_filters.templatetags.text_filters import (
     best_case_name,
     html_decode,
 )
 from cl.lib.command_utils import logger
 from cl.lib.elasticsearch_utils import build_es_base_query
 from cl.lib.fields import JoinField, PercolatorField
-from cl.lib.search_index_utils import get_parties_from_case_name, null_map
+from cl.lib.search_index_utils import (
+    get_parties_from_case_name,
+    get_parties_from_case_name_bankr,
+    null_map,
+)
 from cl.lib.utils import deepgetattr
 from cl.people_db.models import (
     Attorney,
@@ -1258,8 +1263,10 @@ def prepare_parties(self, instance):
         if not out["party"]:
             # Get party from docket case_name if no normalized parties are
             # available.
-            party_from_case_name = get_parties_from_case_name(
-                instance.case_name
+            party_from_case_name = (
+                get_parties_from_case_name_bankr(instance.case_name)
+                if is_bankruptcy_court(instance.court_id)
+                else get_parties_from_case_name(instance.case_name)
             )
             out["party"] = party_from_case_name if party_from_case_name else []
 

diff --git a/cl/search/tasks.py b/cl/search/tasks.py
@@ -32,8 +32,12 @@
 )
 from cl.audio.models import Audio
 from cl.celery_init import app
+from cl.corpus_importer.utils import is_bankruptcy_court
 from cl.lib.elasticsearch_utils import build_daterange_query
-from cl.lib.search_index_utils import get_parties_from_case_name
+from cl.lib.search_index_utils import (
+    get_parties_from_case_name,
+    get_parties_from_case_name_bankr,
+)
 from cl.people_db.models import Person, Position
 from cl.search.documents import (
     ES_CHILD_ID,
@@ -316,8 +320,14 @@ def document_fields_to_update(
                             # parties are available.
                             if main_instance.parties.exists():
                                 continue
-                            field_value = get_parties_from_case_name(
-                                main_instance.case_name
+                            field_value = (
+                                get_parties_from_case_name_bankr(
+                                    main_instance.case_name
+                                )
+                                if is_bankruptcy_court(main_instance.court_id)
+                                else get_parties_from_case_name(
+                                    main_instance.case_name
+                                )
                             )
                         else:
                             field_value = getattr(related_instance, field)