#!/usr/bin/env python
"""
--> Parse library and just do JSON adapted for Elasticsearch

iTunes Graph Parser

Parses an iTunes library XML file and generates a JSON file for use in the
D3.js JavaScript library.

Example Track info:
{
    'Album': 'Nirvana',
    'Persistent ID': 'A50FE1436726815C',
    'Track Number': 4,
    'Location': 'file://localhost/Users/foo/Music/iTunes/iTunes%20Music/Nirvana/Nirvana/04%20Sliver.mp3',
    'File Folder Count': 4,
    'Album Rating Computed': True,
    'Total Time': 134295,
    'Sample Rate': 44100,
    'Genre': 'Rock/Alternative',
    'Bit Rate': 236,
    'Kind': 'MPEG audio file',
    'Name': 'Sliver',
    'Artist': 'Nirvana',
    'Date Added': datetime.datetime(2006, 10, 11, 4, 31, 38),
    'Album Rating': 60,
    'Rating': 40,
    'Date Modified': datetime.datetime(2009, 7, 18, 4, 57, 41),
    'Library Folder Count': 1,
    'Year': 2002,
    'Track ID': 7459,
    'Size': 3972838,
    'Track Type': 'File',
    'Play Count': 2,
    'Play Date UTC': datetime.datetime(2009, 7, 18, 5, 00, 00)
}
"""

from __future__ import division
from optparse import OptionParser
import os
import io
import plistlib
import json
import datetime
import sys


class SetEncoder(json.JSONEncoder):
    """JSON encoder that additionally serializes sets and datetimes."""

    def default(self, obj):
        """Return a JSON-serializable stand-in for ``obj``.

        Sets become lists and ``datetime.datetime`` values become ISO 8601
        strings; anything else is delegated to the base encoder, which
        raises ``TypeError`` for unsupported types.
        """
        if isinstance(obj, set):
            return list(obj)
        if isinstance(obj, datetime.datetime):
            return obj.isoformat()
        return json.JSONEncoder.default(self, obj)


class ITunesParser(object):
    """
    Parse an iTunes Library and produce JSON - for ELS
    """

    def __init__(self, library_file):
        """Remember the library location and reset the aggregates.

        ``library_file`` is a path to the iTunes library XML, or an already
        opened binary file object containing it.
        """
        self._albums = {}
        self._artists = {}
        self.library_file = library_file

    def to_json(self):
        """Return the song bulk payload built by ``_process_songs``.

        Artist and album aggregates are collected as a side effect; they
        are not written anywhere unless ``_write_artists`` /
        ``_write_albums`` are called explicitly.
        """
        return self._process_songs()

    def to_json_p(self):
        """Produce JSON-P content: the ``to_json`` output wrapped in a call
        to ``itgCallback``.
        """
        # TODO: accept a minimum-rating parameter (e.g. rating=4).
        json_content = self.to_json()
        return ';itgCallback(' + json_content + ');'

    def _read_tracks(self):
        """Read the library and return its ``Tracks`` part.

        ``plistlib.readPlist`` was removed in Python 3.9, so
        ``plistlib.load`` is used whenever it exists; ``readPlist`` is only
        the fallback for interpreters that predate ``load`` (Python 2).
        """
        source = self.library_file
        load = getattr(plistlib, 'load', None)
        if load is None:
            plist = plistlib.readPlist(source)
        elif hasattr(source, 'read'):
            # Already an open file object (readPlist accepted these too).
            plist = load(source)
        else:
            with io.open(source, 'rb') as handle:
                plist = load(handle)
        return plist['Tracks']

    def _process_songs(self):
        """Return newline-delimited JSON for an ELS bulk request.

        For every music track two lines are produced: the bulk ``index``
        action (keyed by the track's persistent id) and the track document
        itself.  Non-file tracks, podcasts and videos are skipped.

        TODO: just return a _correct_ JSON and treat in another place/class.
        """
        tracks = self._read_tracks()
        chunks = []
        for track in tracks.values():
            # Filter out any non-music; a track without a type is treated
            # as non-music instead of aborting the whole export.
            if track.get('Track Type') != 'File':
                continue
            if 'Podcast' in track or 'Has Video' in track:
                continue

            action = {
                "index": {
                    "_index": "itunessongs",
                    "_type": "song",
                    "_id": track['Persistent ID'],
                }
            }

            # Update the per-artist and per-album aggregates.
            self._process_artist(track)
            self._process_album(track)

            chunks.append(json.dumps(action, indent=None, cls=SetEncoder))
            chunks.append("\n")
            chunks.append(json.dumps(track, indent=None, cls=SetEncoder))
            chunks.append("\n")
        # Join once instead of growing a string inside the loop.
        return "".join(chunks)

    @staticmethod
    def _accumulate(entry, track):
        """Fold one track's count, rating, plays and genres into ``entry``."""
        entry['count'] += 1
        # Ratings are stored in steps of 20; convert to a 0-5 scale.
        entry['rating'] += track.get('Rating', 0) // 20
        entry['plays'] += track.get('Play Count', 0)
        if 'Genre' in track:
            # A genre such as 'Rock/Alternative' counts as two genres.
            entry['genres'] |= set(track['Genre'].split('/'))

    def _process_artist(self, track):
        """Update the aggregate entry of the track's artist, if it has one."""
        if 'Artist' not in track:
            return

        akey = track['Artist']
        if akey not in self._artists:
            self._artists[akey] = {
                'id': len(self._artists),
                'name': akey,
                'count': 0,
                'plays': 0,
                'rating': 0,
                'genres': set(),
            }
        self._accumulate(self._artists[akey], track)

    def _process_album(self, track):
        """Update the aggregate entry of the track's album, if it has one."""
        if 'Album' not in track:
            return

        akey = track['Album']
        if akey not in self._albums:
            self._albums[akey] = {
                'id': len(self._albums),
                'name': akey,
                'count': 0,
                'plays': 0,
                'rating': 0,
                'genres': set(),
                'artist': set(),
            }
        album = self._albums[akey]
        self._accumulate(album, track)

        # Record the artist even when the track has no genre (a missing
        # genre used to skip this step).
        if 'Artist' in track:
            album['artist'].add(track['Artist'])

    @staticmethod
    def _write_bulk_file(path, doc_type, documents):
        """Write ``documents`` to ``path`` as action/document line pairs."""
        action = json.dumps(
            {"index": {"_index": "itunessongs", "_type": doc_type}},
            indent=None, cls=SetEncoder)
        with io.open(path, 'wb') as handle:
            for document in documents:
                body = json.dumps(document, indent=None, cls=SetEncoder)
                # str.encode works on Python 2 and 3, unlike bytes(s, enc).
                handle.write((action + "\n").encode('utf-8'))
                handle.write((body + "\n").encode('utf-8'))

    def _write_artists(self):
        """Write artists data to another JSON file (es-artist-data.json)."""
        self._write_bulk_file('es-artist-data.json', 'artist',
                              self._artists.values())

    def _write_albums(self):
        """Write albums data to another JSON file (es-albums-data.json)."""
        self._write_bulk_file('es-albums-data.json', 'album',
                              self._albums.values())


#### main block ####

# Default input & output files
DEFAULT_LIBRARY_FILE = os.path.expanduser('iTunesMiniLibrary.xml')
DEFAULT_OUTPUT_FILE = os.path.join(
    os.path.dirname(os.path.realpath(__file__)), 'es-music-data.json')

# Get options
parser = OptionParser(version="%prog 1.0")
parser.add_option('-f', '--file', dest='file', type='string',
                  help='iTunes Library XML file path',
                  default=DEFAULT_LIBRARY_FILE)
# %default is expanded by optparse, so the help always shows the real default.
parser.add_option('-o', '--output', dest='output', type='string',
                  help='Output to file (default=%default)',
                  default=DEFAULT_OUTPUT_FILE)
parser.add_option('-c', '--console', dest='console', action='store_true',
                  help='Output to console instead of file')
parser.add_option('-p', '--jsonp', dest='jsonp', action='store_true',
                  help='Output in JSON-P format')
parser.add_option('-v', '--verbose', dest='verbose', action='store_true',
                  help='Verbose output')


def main(argv=None):
    """Run the command-line tool; ``argv`` defaults to ``sys.argv[1:]``."""
    options, _args = parser.parse_args(argv)

    itunes_parser = ITunesParser(options.file)
    if options.jsonp:
        output = itunes_parser.to_json_p()
    else:
        output = itunes_parser.to_json()

    if options.console:
        print(output)
    else:
        with io.open(options.output, 'wb') as outfile:
            # One code path for Python 2 and 3.
            outfile.write(output.encode('utf-8'))
        print('JSON data written to: ' + options.output)


if __name__ == '__main__':
    main()