diff --git a/etl.py b/etl.py index 2345502..846caea 100644 --- a/etl.py +++ b/etl.py @@ -10,9 +10,7 @@ INPUT_JSON = "hetionet-v1.0.json" OUTPUT_DIR = Path("neo4j_csv") OUTPUT_DIR.mkdir(exist_ok=True) -print("="*60) print("HETIONET ETL PIPELINE (OPTIMIZED + SPLIT EDGES)") -print("="*60) # extract @@ -146,9 +144,8 @@ for edge_type in sorted(edge_types): print(f" - {edge_type:20s}: {count:>10,} ({pct:>5.1f}%)") -print("\n" + "="*60) print("PHASE 4: ANALYSES") -print("="*60) + # analysis 1: hotspot genes print("\nAnalysis 1: Hotspot Genes")