Complete dropped albums list with all 89 truly dropped albums from 2020

- Added all 89 albums that were genuinely dropped between the 2020 and 2023 lists
- Fixed incorrect status markings (many albums marked "New in 2023" were not new)
- Removed duplicates and albums incorrectly marked as dropped
- Final count: 589 total (500 main list + 89 dropped)
- Updated JavaScript validation for extended range
- Created comprehensive analysis scripts to verify data

Math now adds up correctly: 89 albums dropped to make room for new additions

🤖 Generated with [Claude Code](https://claude.ai/code)

Co-Authored-By: Claude <noreply@anthropic.com>
This commit is contained in:
Johan Lundberg 2025-07-01 01:14:06 +02:00
parent a2713e9fb1
commit c3a24799c8
12 changed files with 1348 additions and 8 deletions

65
scripts/find_truly_new.py Normal file
View file

@ -0,0 +1,65 @@
#!/usr/bin/env python3
"""
Find albums that are TRULY new in 2023 (not in 2020 list at all).
"""
import csv
def normalize_text(text: str) -> str:
    """Normalize text for comparison.

    Lowercases the input, replaces ``&`` with ``and``, removes leading and
    trailing whitespace, and collapses every internal run of whitespace to a
    single space, so that spacing differences between data sources do not
    prevent two otherwise identical names from matching.

    Args:
        text: Raw artist or album name.

    Returns:
        The normalized string, suitable for use in equality/set lookups.
    """
    # str.split() with no arguments splits on any whitespace run and drops
    # empty leading/trailing pieces, so joining with one space both trims and
    # collapses in a single pass.
    return ' '.join(text.lower().replace('&', 'and').split())
def main():
    """Report which 'New in 2023' rows are really absent from the 2020 list.

    Reads ``rolling_stone_2020_simple.csv`` and ``top_500_albums_2023.csv``
    from the current working directory, compares albums by their normalized
    (artist, album) pair, and prints two sections: rows with status
    'New in 2023' that are not in the 2020 file, and rows with that status
    that are in the 2020 file (only the first 10 of the latter are listed).
    Only 2023 rows whose rank is at most 500 are considered.
    """
    # Normalized (artist, album) pairs for every row of the 2020 file.
    with open('rolling_stone_2020_simple.csv', 'r', encoding='utf-8') as handle:
        albums_2020 = {
            (normalize_text(entry['Artist']), normalize_text(entry['Album']))
            for entry in csv.DictReader(handle)
        }
    print(f"📊 Loaded {len(albums_2020)} albums from 2020 list")

    # Split the 'New in 2023' rows by whether the 2020 file already has them.
    genuine = []
    mislabeled = []
    with open('top_500_albums_2023.csv', 'r', encoding='utf-8') as handle:
        for entry in csv.DictReader(handle):
            if int(entry['Rank']) > 500:
                continue
            lookup = (normalize_text(entry['Artist']), normalize_text(entry['Album']))
            if entry['Status'] != 'New in 2023':
                continue
            summary = {
                'rank': entry['Rank'],
                'artist': entry['Artist'],
                'album': entry['Album'],
            }
            bucket = mislabeled if lookup in albums_2020 else genuine
            bucket.append(summary)

    divider = "=" * 80

    print(f"\n✅ TRULY new albums in 2023 (not in 2020 list):")
    print(divider)
    for item in genuine:
        print(f"#{item['rank']:3s} - {item['artist']} - {item['album']}")
    print(divider)
    print(f"Total truly new: {len(genuine)}")

    print(f"\n❌ Incorrectly marked as 'New in 2023' (were in 2020 list):")
    print(divider)
    for item in mislabeled[:10]:  # Only the first 10 are listed
        print(f"#{item['rank']:3s} - {item['artist']} - {item['album']}")
    hidden = len(mislabeled) - 10
    if hidden > 0:
        print(f"... and {hidden} more")
    print(divider)
    print(f"Total incorrectly marked: {len(mislabeled)}")
# Run the report only when this file is executed as a script.
if __name__ == "__main__":
    main()