diff --git a/build_search_index.py b/build_search_index.py new file mode 100644 index 0000000..fc0d1a8 --- /dev/null +++ b/build_search_index.py @@ -0,0 +1,172 @@ +#!/usr/bin/env python3 +""" +Build searchIndex.json for AlcHepNet website search functionality. +Indexes all active HTML pages (excludes backups, templates, and components). +""" + +import os +import re +import json +from pathlib import Path + +SRC_DIR = Path(__file__).parent / "src" +OUTPUT_FILE = SRC_DIR / "searchIndex.json" +PUBLICATIONS_JSON = SRC_DIR / "Publishing" / "doc" / "all_publications.json" +PUBLICATIONS_URL = "Publishing/publications.html" + +# Pages to exclude from index +EXCLUDE_PATTERNS = [ + r"\.backup", + r"-backup\.html$", + r"\.bk\.html$", + r"-bk\.html$", + r"navbar\.html$", + r"footer\.html$", + r"search-modal\.html$", + r"template", + r"page-template", +] + + +def should_exclude(filepath: Path) -> bool: + """Check if file should be excluded from index.""" + name = filepath.name + for pattern in EXCLUDE_PATTERNS: + if re.search(pattern, name, re.IGNORECASE): + return True + return False + + +def strip_html(html: str) -> str: + """Remove HTML tags and decode entities.""" + # Remove script and style blocks + text = re.sub(r"", " ", html, flags=re.DOTALL | re.IGNORECASE) + text = re.sub(r"", " ", text, flags=re.DOTALL | re.IGNORECASE) + # Remove all HTML tags + text = re.sub(r"<[^>]+>", " ", text) + # Collapse whitespace + text = re.sub(r"\s+", " ", text) + return text.strip() + + +def extract_title(html: str, filepath: Path) -> str: + """Extract page title from HTML.""" + match = re.search(r"
- The AlcHepNet Biorepository is a part of the Indiana University Data Coordinating Center (DCC). Its primary function is to support biospecimen collection for ongoing AlcHepNet studies. The DCC oversees the operation of the biorepository in partnership with the Indiana Biobank (IB), which is a state-of-the-art facility for biospecimen storage, tracking, and distribution. The biorepository team uses a comprehensive, searchable database to manage all biospecimens and the associated metadata. The DCC provides a link between stored biospecimen data to facilitate research. + The AlcHepNet Biorepository is a part of the Indiana University Data Coordinating Center (DCC). Its primary function is to support biospecimen collection for ongoing AlcHepNet studies. The DCC oversees the operation of the biorepository in partnership with the Indiana Biobank (IB), which is a state-of-the-art facility for biospecimen storage, tracking, and distribution. The biorepository team uses a comprehensive, searchable database to manage all biospecimens and the associated metadata. The DCC provides access to stored biospecimens, and the linkage between biospecimens and clinical data to facilitate research.
- The primary objective of the study is to determine whether subjects receiving F-652 followed by enhanced AUD treatments will have better alcohol and liver-related outcomes at 6 months compared to those receiving prednisone plus usual care for AUD. Patients assigned to the AUD treatment will receive Acamprosate and counseling, while those assigned to the AUD usual care will receive brief advice and referral to a 12-step program. + The primary objective of the study is to determine whether subjects receiving F-652 (recombinant IL-22) followed by enhanced AUD treatments will have better alcohol and liver-related outcomes at 6 months compared to those receiving prednisone plus usual care for AUD. Patients assigned to the AUD treatment will receive Acamprosate and counseling, while those assigned to the AUD usual care will receive brief advice and referral to a 12-step program.
diff --git a/src/Data_Access/design.html b/src/Data_Access/design.html index 399c5be..1215118 100644 --- a/src/Data_Access/design.html +++ b/src/Data_Access/design.html @@ -31,7 +31,7 @@
- The heterogeneous clinical data, biosample information, and omics data information will be extracted from the randomized clinical trial, the observational study, and all other alcohol-associated hepatitis (AH) research projects, standardized according to the ARDaC Data Standard, harmonized according to the ARDaC Common Data Model, and hosted in a central ARDaC Data Warehouse. Specifically, the novel ARDaC Common Data Model is derived from and compatible with the Genomics Data Common (GDC) Data Model and is compliant with the FAIR Principles so that AlcHepNet multimodal data will be findable, accessible, interoperable, and reusable. The ARDaC Data Warehouse is the data source for the ARDaC web application, which is open to the public, as well as for regular reporting and customized services within the AlcHepNet consortium. A graph-based provenance model is used for comprehensive data dependency and version control. The ARDaC digital entities, including the standards, data model, data, metadata, scripts, and codes, are attributable, trackable, and reproducible. + The heterogeneous clinical data, biosample information, and omics data information will be extracted from the randomized clinical trial and all other alcohol-associated hepatitis (AH) research projects, standardized according to the ARDaC Data Standard, harmonized according to the ARDaC Common Data Model, and hosted in a central ARDaC Data Warehouse. Specifically, the novel ARDaC Common Data Model is derived from and compatible with the Genomics Data Common (GDC) Data Model and is compliant with the FAIR Principles so that AlcHepNet multimodal data will be findable, accessible, interoperable, and reusable. The ARDaC Data Warehouse is the data source for the ARDaC web application, which is open to the public, as well as for regular reporting and customized services within the AlcHepNet consortium. A graph-based provenance model is used for comprehensive data dependency and version control. The ARDaC digital entities, including the standards, data model, data, metadata, scripts, and codes, are attributable, trackable, and reproducible.
- Data request can be submitted by the PIs of the AlcHepNet consortium. Internal - and external collaborators are encouraged, but the actual request must be submitted by one of the PIs. Data - requests by the PI automatically imply he/she is responsible for completing the study in a timely and rigorous - fashion, avoids "mission creep" and abides by other AlcHepNet policies. -
++ Data request can be submitted by the PIs of the AlcHepNet consortium. + Internal + and external collaborators are encouraged, but the actual request must be submitted by one of the PIs. + Data + requests by the PI automatically imply he/she is responsible for completing the study in a timely and + rigorous + fashion, avoids "mission creep" and abides by other AlcHepNet policies. +
-- Request process -
+ Request process +
This page is under construction. Content will be added soon.
-Latest updates, announcements, and publications from AlcHepNet
xxxx
+The ITAALD trial started enrollment in January 2026. The first two patients were enrolled at the Cleveland Clinic. Congratulations to the Cleveland Clinic team!
+xxxx
+Loading recent publications...
+The Alcohol-associated Hepatitis Network project, AlcHepNet, comprised of ten leading partner institutions in the field, will collect and organize patient information, associated data, and samples that can help shed greater light on this disease. Combined, these approaches will improve treatment and how we care for patients with this devastating liver condition.
-Alcohol-associated hepatitis (AH) is a leading cause of liver-related morbidity and mortality. This network represents a coordinated submission of several NIAAA-funded consortia that have come together as the Alcohol-associated Hepatitis Network (AlcHepNet). Collectively, the network will synergize efforts and expertise to better understand AH. The network aims to: -
-- Develop a multicenter, randomized, double-blinded, placebo-controlled trial focused on the treatment of severe alcohol-associated hepatitis (sAH) and alcohol use disorder (AUD). -
-- The primary purpose study is to determine whether subjects receiving AUD treatments combined with sAH therapies will improve alcohol and liver-related events at 6 months compared to usual care for AUD. Patients will receive either integrated treatment with acamprosate and counseling or standard care with brief advice and referral to a 12-step program. -
-- The secondary purpose of the study is to determine if F-652 is safe and effective in treating severe alcohol-associated hepatitis when compared to prednisone. Subjects will receive F-652 on days 1 and 7 or prednisone for 28 days. Outcomes will be measured by overall survival at 90 days. -
- -
-
-
-
-
- AlcHepNet is a clinical and translational research initiative funded by the National Institute on Alcohol Abuse and Alcoholism (NIAAA), a division of NIH.
-