silo.pasta/LastFM.py


import os
import csv
import json
import logging
from operator import attrgetter
from collections import namedtuple
import requests
import arrow
from datetime import datetime
import settings
import keys
from pprint import pprint
from math import floor
from common import cached_property
import sys
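
# A single scrobble row as written to the CSV archive.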
Track = namedtuple(
"Track", ["timestamp", "artist", "album", "title", "artistid", "albumid", "img"]
)
class LastFM(object):
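    """Pull recent scrobbles from the Last.fm API and append the new ones
    to a CSV archive under settings.paths["archive"]."""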
url = "http://ws.audioscrobbler.com/2.0/"
def __init__(self):
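        # Base query parameters; "from" and "page" are filled in by run().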
self.params = {
"method": "user.getrecenttracks",
"user": keys.lastfm.get("username"),
"api_key": keys.lastfm.get("key"),
"format": "json",
"limit": "200",
}
# if os.path.isfile(self.target):
# mtime = os.path.getmtime(self.target)
# self.params.update({"from": mtime})
@property
def target(self):
return os.path.join(settings.paths.get("archive"), "lastfm.csv")
@cached_property
def existing(self):
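        """Unix timestamps of scrobbles already in the CSV archive, used to skip duplicates."""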
timestamps = []
if os.path.isfile(self.target):
with open(self.target, "r") as f:
r = csv.reader(f)
for row in r:
try:
timestamps.append(int(datetime.fromisoformat(row[0]).timestamp()))
except Exception as e:
logging.error("arrow failed on row %s as: %s", row[0], e)
continue
return timestamps
@property
def exists(self):
return os.path.isfile(self.target)
def extracttracks(self, data):
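        """Turn one page of API results into Track rows, skipping the
        currently playing entry (no "date") and already archived timestamps."""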
tracks = []
if not data:
return tracks
for track in data.get("track", []):
if "date" not in track:
continue
ts = arrow.get(int(track.get("date").get("uts")))
            # arrow >= 1.0 exposes .timestamp() as a method, so compare via int_timestamp
            if ts.int_timestamp in self.existing:
continue
entry = Track(
ts.format("YYYY-MM-DDTHH:mm:ssZZ"),
track.get("artist").get("#text", ""),
track.get("album").get("#text", ""),
track.get("name", ""),
track.get("artist").get("mbid", ""),
track.get("album").get("mbid", ""),
track.get("image", [])[-1].get("#text", ""),
)
tracks.append(entry)
return tracks
def fetch(self):
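        """Request one page of user.getrecenttracks and return its "recenttracks" payload."""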
        r = requests.get(self.url, params=self.params)
        # fail loudly on HTTP errors instead of trying to parse an error body
        r.raise_for_status()
        return r.json().get("recenttracks")
def run(self):
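        """Resume from the newest archived timestamp, walk the paginated
        results, and append any new scrobbles to the CSV archive."""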
        if self.existing:
self.params.update({"from": sorted(self.existing)[-1]})
#startpage = max(1, floor(len(self.existing) / int(self.params.get("limit"))))
#startpage = 1
self.params.update({"page": 1})
try:
data = self.fetch()
tracks = self.extracttracks(data)
total = int(data.get("@attr").get("totalPages"))
current = int(data.get("@attr").get("page"))
cntr = total - current
except Exception as e:
logging.error("Something went wrong: %s", e)
return
        if not tracks:
return
while cntr > 0:
current = current + 1
cntr = total - current
logging.info("requesting page #%d of paginated results", current)
self.params.update({"page": current})
data = self.fetch()
tracks = tracks + self.extracttracks(data)
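        # Create the archive with a header row on the first run.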
if not self.exists:
with open(self.target, "w") as f:
writer = csv.DictWriter(f, fieldnames=Track._fields)
writer.writeheader()
        if tracks:
with open(self.target, "a") as f:
writer = csv.writer(f, quoting=csv.QUOTE_NONNUMERIC)
writer.writerows(sorted(tracks, key=attrgetter("timestamp")))
if __name__ == "__main__":
lfm = LastFM()
lfm.run()