-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathyt.py
71 lines (58 loc) · 2.46 KB
/
yt.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
from youtube_title_parse import get_artist_title
from googleapiclient.discovery import build
from oauth2client.tools import argparser
from dataclasses import dataclass
from pprint import pprint
import re
import os
@dataclass
class Song:
artist: str
title: str
def clean_song_info(song: Song) -> Song:
artist, title = song.artist, song.title
title = re.sub('\(.*', '', title) # Remove everything after '(' including '('
title = re.sub('ft.*', '', title) # Remove everything after 'ft' including 'ft'
title = re.sub(',.*', '', title) # Remove everything after ',' including ','
artist = re.sub('\sx\s.*', '', artist) # Remove everything after ' x ' including ' x '
artist = re.sub('\(.*', '', artist) # Remove everything after '(' including '('
artist = re.sub('ft.*', '', artist) # Remove everything after 'ft' including 'ft'
artist = re.sub(',.*', '', artist) # Remove everything after ',' including ','
return Song(artist.strip(), title.strip()) # Remove whitespaces from start and end
class Youtube:
DEVELOPER_KEY = os.getenv('YOUTUBE_API_KEY')
YOUTUBE_API_SERVICE_NAME = "youtube"
YOUTUBE_API_VERSION = "v3"
def __init__(self):
self.songs = []
self.youtube = build(
Youtube.YOUTUBE_API_SERVICE_NAME,
Youtube.YOUTUBE_API_VERSION,
developerKey=Youtube.DEVELOPER_KEY
)
def __fetch_songs(self, youtube, playlist_id, page_token=None):
result = youtube.playlistItems().list(
part="snippet",
playlistId=playlist_id,
maxResults="300",
pageToken=page_token
).execute()
for item in result['items']:
song = item['snippet']['title']
try:
artist, title = get_artist_title(song)
self.songs.append(clean_song_info(Song(artist, title)))
except:
print(f'Error parsing {song}')
return result
def get_songs_from_playlist(self, playlist_id: str):
youtube = self.youtube
result = self.__fetch_songs(youtube, playlist_id)
while 'nextPageToken' in result:
page_token = result['nextPageToken']
result = self.__fetch_songs(youtube, playlist_id, page_token)
return self.songs
if __name__ == "__main__":
yt = Youtube()
print(clean_song_info(Song('Michael Jackson', 'Billie Jean')))
pprint(yt.get_songs_from_playlist(''))