From f2eec0afd9f78ef319d0a4220acf6864db48171b Mon Sep 17 00:00:00 2001 From: Eduard Prigoana Date: Tue, 19 Aug 2025 08:15:02 +0300 Subject: [PATCH] a --- config.py | 3 +++ info/status.json | 10 +++++----- parser.py | 5 ++++- 3 files changed, 12 insertions(+), 6 deletions(-) diff --git a/config.py b/config.py index 655707f..19e2d7a 100644 --- a/config.py +++ b/config.py @@ -15,7 +15,10 @@ exclude_names = { "K4HKn0", "AI Models", "🎹 BPM & Key Tracker", + "🎹Comps & Edits", "🎹 Worst Comps & Edits", + "🎹Worst Comps & Edits", + "🎹 Yedits", "Allegations", "Rap Disses Timeline", "Underground Artists", diff --git a/info/status.json b/info/status.json index e501091..4598760 100644 --- a/info/status.json +++ b/info/status.json @@ -1,15 +1,15 @@ { - "last_updated": "2025-08-11T17:26:51.365776Z", + "last_updated": "2025-08-19T05:14:17.304876Z", "files": { "Artists.html": { - "hash": "5c794c69a86112ac86a59c25f62409754b692b08ab57c4555afa9e45721ed054", - "last_archived": "2025-08-11T17:26:51.365790Z" + "hash": "b48e3d341500e82e179f8813443e5fed899313b48ef79b83bd87388189c49a90", + "last_archived": "2025-08-19T05:14:17.304886Z" }, "artists.csv": { - "hash": "f65b4bac779810e9f6775f3d98505d876e2692233c2581bd4a53471c8cf188ac" + "hash": "609ab1ad6adf62bc1ab8e1b433e1676ab6787e65c760e22d7da7a8e26bbdf33e" }, "artists.xlsx": { - "hash": "f41e3527911e55863c3cc4e0cec778bb689d8d6d5086c53fe964df963583b910" + "hash": "101b6cdef091774668b030bd1bed27a78cb227b487f5f04883c7a2f4bb184b5e" } } } \ No newline at end of file diff --git a/parser.py b/parser.py index c848eb5..7958e0c 100644 --- a/parser.py +++ b/parser.py @@ -19,8 +19,11 @@ def generate_csv(): if len(cells) < 4: continue + # Always take the artist name from the column text + artist_name_raw = cells[0].get_text(strip=True) + + # Only use the <a> tag for the URL (if it exists) link_tag = cells[0].find("a") - artist_name_raw = link_tag.get_text(strip=True) if link_tag else cells[0].get_text(strip=True) artist_url = link_tag["href"] if link_tag else "" 
if not artist_url: continue