maloja/database.py

from bottle import route, run, template, static_file, request, response
from importlib.machinery import SourceFileLoader
import waitress
import os
import datetime
import cleanup
import sys


# In-memory database. Scrobbles reference tracks and tracks reference artists by list index.
SCROBBLES = []	# Format: tuple(track_ref,timestamp,saved) - track_ref is an index into TRACKS, saved is True for entries read from the log files
ARTISTS = []	# Format: artist - the value handed to getArtistID(), its list index is the artist_ref
TRACKS = []	# Format: tuple(frozenset(artist_ref,...),title) - every artist_ref is an index into ARTISTS


# by id
#def getScrobbleObject(o):
#	#return {"artists":getTrackObject(SCROBBLES[o][0])["artists"],"title":getTrackObject(SCROBBLES[o][0])["title"],"time":SCROBBLES[o][1],"saved":SCROBBLES[o][2]}
#	return {"artists":getTrackObject(SCROBBLES[o][0])["artists"],"title":getTrackObject(SCROBBLES[o][0])["title"],"time":SCROBBLES[o][1]}
#	
#def getArtistObject(o):
#	return ARTISTS[o]
#	
#def getTrackObject(o):
#	return {"artists":[getArtistObject(a) for a in TRACKS[o][0]],"title":TRACKS[o][1]}

# by object

def getScrobbleObject(o):
	"""Expand a scrobble tuple into a dict with the keys "artists", "title" and "time".

	o is a (track_ref,timestamp,saved) tuple; the saved flag is not part of the result.
	"""
	resolved = getTrackObject(TRACKS[o[0]])
	scrobble = {key:resolved[key] for key in ("artists","title")}
	scrobble["time"] = o[1]
	return scrobble
	
def getArtistObject(o):
	"""Return the outward representation of an artist.

	Artists need no conversion, so the given value is handed back unchanged.
	"""
	artist = o
	return artist
	
def getTrackObject(o):
	"""Expand a track tuple into a dict with the keys "artists" and "title".

	o is a (frozenset(artist_ref,...),title) tuple; every artist_ref is looked up in ARTISTS.
	"""
	names = []
	for ref in o[0]:
		names.append(getArtistObject(ARTISTS[ref]))
	return dict(artists=names,title=o[1])


def createScrobble(artists,title,time):
	"""Append a new scrobble that has not been written to disk yet (saved flag False)."""
	track_ref = getTrackID(artists,title)
	SCROBBLES.append((track_ref,time,False))

def readScrobble(artists,title,time):
	"""Append a scrobble that is already persisted (saved flag True)."""
	track_ref = getTrackID(artists,title)
	SCROBBLES.append((track_ref,time,True))

def getArtistID(name):
	"""Return the index of an artist in ARTISTS, registering the artist if it is unknown.

	name: the artist as it should be stored in ARTISTS.
	Returns the (possibly newly assigned) list index.
	"""
	try:
		return ARTISTS.index(name)
	except ValueError:
		# list.index() signals "not found" with ValueError; anything else is a real error
		# and must not be mistaken for a missing artist
		i = len(ARTISTS)
		ARTISTS.append(name)
		return i
			
def getTrackID(artists,title):
	"""Return the index of a track in TRACKS, registering the track if it is unknown.

	artists: iterable of artists; each one is resolved (and registered if needed) via getArtistID().
	title: the track title.
	A track is identified by the unordered set of its artists plus its title.
	"""
	obj = (frozenset(getArtistID(name=a) for a in artists),title)

	try:
		return TRACKS.index(obj)
	except ValueError:
		# list.index() signals "not found" with ValueError; only that case creates a new track
		i = len(TRACKS)
		TRACKS.append(obj)
		return i


@route("/scrobbles")
def get_scrobbles():
	"""Return the scrobbles, optionally restricted by the "artist" query parameter."""
	artist_filter = request.query.get("artist")
	scrobbles = db_query(artist=artist_filter)

	# the result is wrapped in a dict because bottle serializes dicts to JSON, but not bare lists
	return {"list":scrobbles}

@route("/tracks")
def get_tracks():
	"""Return all known tracks, optionally restricted by the "artist" query parameter.

	The artist has to match a stored artist exactly; an unknown artist gives an empty list.
	"""
	artist = request.query.get("artist")

	if artist is None:
		matching = TRACKS
	else:
		# tracks store artist indices, not names, so the name has to be resolved first
		try:
			artist_ref = ARTISTS.index(artist)
		except ValueError:
			return {"list":[]}
		matching = [t for t in TRACKS if artist_ref in t[0]]

	# filter on the tuples first and only convert the remaining tracks to dicts
	return {"list":[getTrackObject(t) for t in matching]}
	
@route("/artists")
def get_artists():
	"""Return every known artist, wrapped in a dict under the key "list"."""
	artists = ARTISTS
	return {"list":artists}
	
@route("/charts")
def get_charts():
	"""Placeholder for the charts endpoint; it currently returns None.

	The "since" and "to" query parameters are read but not used yet.
	"""
	params = request.query
	since = params.get("since")
	to = params.get("to")

	# TODO: sum up the totals on db level (before converting to dicts), e.g. starting from
	# db_query(since=since,to=to), and return them as {"list":results}
	return None
	
@route("/newscrobble")
def post_scrobble():
	"""Register a new scrobble from the "artist" and "title" query parameters.

	The scrobble is timestamped with the current UTC time and kept in memory until flush() runs.
	"""
	query = request.query
	raw_artist = query.get("artist")
	raw_title = query.get("title")
	# NOTE(review): cleanup.fullclean presumably normalizes the input and returns (artists,title) - confirm
	artists, title = cleanup.fullclean(raw_artist,raw_title)
	now = datetime.datetime.now(tz=datetime.timezone.utc)
	time = int(now.timestamp())

	## this is necessary for localhost testing
	response.set_header("Access-Control-Allow-Origin","*")

	createScrobble(artists,title,time)

	return ""
	
@route("/flush")
def abouttoshutdown():
	"""Write all unsaved scrobbles to disk via flush() and print a confirmation."""
	flush()
	print("Database saved to disk.")
	# the process is deliberately kept running afterwards (sys.exit() is disabled)

# Starts the server
def runserver(DATABASE_PORT):
	"""Load the database with build_db() and serve it on all interfaces using waitress.

	DATABASE_PORT: port the server listens on.
	"""
	# build_db() replaces the former reload() + buildh() steps
	build_db()

	run(server='waitress', host='0.0.0.0', port=DATABASE_PORT)


def build_db():
	"""Rebuild SCROBBLES from the log files in logs/ while keeping unsaved entries.

	Scrobbles flagged as saved are dropped and read again from every *.tsv file in logs/.
	Each line is expected to be "timestamp<TAB>artists<TAB>title", with multiple artists
	separated by "␟". Artists and tracks are registered on the fly by readScrobble().
	"""
	global SCROBBLES

	# keep only what exists solely in memory, everything else comes back from disk below
	SCROBBLES = [s for s in SCROBBLES if not s[2]]

	for f in os.listdir("logs/"):

		# only real log files, not e.g. backups that merely contain ".tsv" in their name
		if not f.endswith(".tsv"):
			continue

		# the context manager closes the file even if a line fails to parse
		with open("logs/" + f) as logfile:
			for l in logfile:

				l = l.replace("\n","")
				if not l.strip():
					# blank lines (e.g. a trailing newline) carry no scrobble
					continue
				data = l.split("\t")

				## saving album in the scrobbles is supported, but for now we don't use it. It shouldn't be a defining part of the track (same song from Album or EP), but derived information
				artists = data[1].split("␟")
				#album = data[3]
				title = data[2]
				time = int(data[0])

				readScrobble(artists,title,time)
	
		
# builds database of artists and tracks
# UNUSED as it is very resource-heavy, use buildh() instead
def build():
	"""Derive ARTISTS and TRACKS from DATABASE using plain lists (legacy, unused).

	ARTISTS becomes the list of distinct artists in order of first appearance. TRACKS
	becomes a list of {"artists":...,"title":...} dicts, where two entries count as the
	same track if they share the title and the same set of artists.
	"""
	global ARTISTS
	global TRACKS

	artistlist = []
	tracklist = []
	for entry in DATABASE:
		for name in entry["artists"]:
			if name not in artistlist:
				artistlist.append(name)

		# the title comparison comes first so the artist sets are only built for entries
		# that actually share the title
		already_known = any(
			known["title"] == entry["title"] and set(known["artists"]) == set(entry["artists"])
			for known in tracklist
		)
		if not already_known:
			tracklist.append({"artists":entry["artists"],"title":entry["title"]})

	ARTISTS = artistlist
	TRACKS = tracklist


# builds database of artists and tracks
# uses better data types to quickly find all unique tracks
# now also UNUSED since we build everything in one step with build_db()
def buildh():
	"""Derive ARTISTS and TRACKS from DATABASE using sets (legacy, unused).

	ARTISTS becomes a list of the distinct artists, TRACKS a list of distinct
	(frozenset(artists),title) tuples. Both lists are built from sets.
	"""
	global ARTISTS
	global TRACKS

	unique_artists = set()
	unique_tracks = set()
	for entry in DATABASE:
		unique_artists.update(entry["artists"])

		# tracks are kept as tuples of frozenset(artists) and title so that they are hashable
		# and easy to compare; they are only converted to dicts once that is needed
		key = (frozenset(entry["artists"]),entry["title"])
		unique_tracks.add(key)

	print("Done, now converting back!")

	ARTISTS = list(unique_artists)
	TRACKS = list(unique_tracks)


# Rebuilds the database from disk, keeps cached entries	
# unused, this is now done in build_db()
def reload():
	"""Rebuild DATABASE from the *.csv files in logs/ while keeping unsaved entries (legacy, unused).

	Entries flagged as saved are dropped and read again from disk. Each line is expected
	to be "timestamp,artists,title" with multiple artists separated by "/".
	NOTE(review): DATABASE is not defined in the visible part of this module - confirm
	before reviving this function.
	"""
	# drop everything that is already on disk, otherwise it would be duplicated below;
	# slice assignment keeps the list object that other code may hold on to
	DATABASE[:] = [t for t in DATABASE if not t["saved"]]

	for f in os.listdir("logs/"):

		if not f.endswith(".csv"):
			continue

		# the context manager closes the file even if a line fails to parse
		with open("logs/" + f) as logfile:
			for l in logfile:

				l = l.replace("\n","")
				if not l.strip():
					# blank lines carry no scrobble
					continue
				data = l.split(",")

				## saving album in the scrobbles is supported, but for now we don't use it. It shouldn't be a defining part of the track (same song from Album or EP), but derived information
				artists = data[1].split("/")
				#album = data[3]
				title = data[2]
				time = int(data[0])

				DATABASE.append({"artists":artists,"title":title,"time":time,"saved":True})

# Saves all cached entries to disk			
def flush():
	"""Append every unsaved scrobble to its monthly log file and mark it as saved.

	One line "timestamp<TAB>artists<TAB>title" is written per scrobble to
	logs/<year>_<month>.tsv, with multiple artists joined by "␟".
	NOTE(review): the month is taken from the local date of the timestamp, while new
	scrobbles are timestamped in UTC - confirm this is intended.
	"""
	for idx, s in enumerate(SCROBBLES):
		if s[2]:
			continue

		t = getScrobbleObject(s)

		artistss = "␟".join(t["artists"])
		timestamp = datetime.date.fromtimestamp(t["time"])

		entry = "\t".join([str(t["time"]),artistss,t["title"]])

		# the context manager closes the file even if writing fails
		with open("logs/" + str(timestamp.year) + "_" + str(timestamp.month) + ".tsv","a") as monthfile:
			monthfile.write(entry)
			monthfile.write("\n")

		# scrobbles are immutable tuples, so the stored entry is replaced by a saved copy;
		# without this every flush would write the same scrobbles to disk again
		SCROBBLES[idx] = (s[0],s[1],True)
			

# Queries the database			
def db_query(artist=None,track=None,since=0,to=9999999999):
	"""Return all scrobbles matching the given filters as a list of scrobble dicts.

	artist: artist index or exact artist name; None disables the filter.
	track: track index or exact title (the first track with that title is used); None disables the filter.
	since, to: exclusive bounds as unix timestamps or as "YYYY[/MM[/DD[/hh[/mm]]]]" strings
		interpreted as UTC; None falls back to the default bound.
	An artist or title that is not in the database gives an empty list.
	"""
	if since is None:
		since = 0
	if to is None:
		to = 9999999999
	if isinstance(since, str):
		since = _date_to_timestamp(since)
	if isinstance(to, str):
		to = _date_to_timestamp(to)

	# this is not meant as a search function. we *can* query the db with a string, but it only works if it matches exactly (and title string simply picks the first track with that name)
	if isinstance(artist, str):
		try:
			artist = ARTISTS.index(artist)
		except ValueError:
			return []
	if isinstance(track, str):
		# TRACKS holds (artists,title) tuples, so the title has to be compared explicitly
		title = track
		track = next((i for i, t in enumerate(TRACKS) if t[1] == title), None)
		if track is None:
			return []

	# checking the artist is redundant once a track is given because every track has a
	# fixed set of artists, but it keeps the filters uniform
	return [
		getScrobbleObject(s) for s in SCROBBLES
		if (track is None or s[0] == track)
		and (artist is None or artist in TRACKS[s[0]][0])
		and (since < s[1] < to)
	]

# Converts a "YYYY[/MM[/DD[/hh[/mm]]]]" string to a UTC unix timestamp, missing parts default to 1970/1/1 0:00
def _date_to_timestamp(value):
	parts = [int(x) for x in value.split("/")]
	date = [1970,1,1,0,0]
	date[:len(parts)] = parts
	return int(datetime.datetime(date[0],date[1],date[2],date[3],date[4],tzinfo=datetime.timezone.utc).timestamp())
	
# Search for strings
def db_search(query,type=None):
	"""Case-insensitive substring search over artists or track titles.

	query: the text to look for.
	type: "ARTIST" returns the matching entries of ARTISTS, "TRACK" returns the matching
		track tuples of TRACKS (matched on the title). Any other value gives an empty list.
	"""
	needle = query.lower()

	if type=="ARTIST":
		return [a for a in ARTISTS if needle in a.lower()]

	if type=="TRACK":
		return [t for t in TRACKS if needle in t[1].lower()]

	# unknown or missing type: nothing to search in
	return []
Initial commit 2018-11-24 18:29:24 +03:00			`from bottle import route, run, template, static_file, request, response`
			`from importlib.machinery import SourceFileLoader`
			`import waitress`
			`import os`
			`import datetime`
Added basic scrobbling function 2018-11-26 18:21:07 +03:00			`import cleanup`
Added basic scrobbler for Plex Web on Chromium/Vivaldi 2018-11-27 18:08:14 +03:00			`import sys`
Initial commit 2018-11-24 18:29:24 +03:00

Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`SCROBBLES = [] # Format: tuple(track_ref,timestamp,saved)`
			`ARTISTS = [] # Format: artist`
			`TRACKS = [] # Format: tuple(frozenset(artist_ref,...),title)`


			`# by id`
			`#def getScrobbleObject(o):`
			`# #return {"artists":getTrackObject(SCROBBLES[o][0])["artists"],"title":getTrackObject(SCROBBLES[o][0])["title"],"time":SCROBBLES[o][1],"saved":SCROBBLES[o][2]}`
			`# return {"artists":getTrackObject(SCROBBLES[o][0])["artists"],"title":getTrackObject(SCROBBLES[o][0])["title"],"time":SCROBBLES[o][1]}`
			`#`
			`#def getArtistObject(o):`
			`# return ARTISTS[o]`
			`#`
			`#def getTrackObject(o):`
			`# return {"artists":[getArtistObject(a) for a in TRACKS[o][0]],"title":TRACKS[o][1]}`

			`# by object`

			`def getScrobbleObject(o):`
			`track = getTrackObject(TRACKS[o[0]])`
			`return {"artists":track["artists"],"title":track["title"],"time":o[1]}`

			`def getArtistObject(o):`
			`return o`

			`def getTrackObject(o):`
			`artists = [getArtistObject(ARTISTS[a]) for a in o[0]]`
			`return {"artists":artists,"title":o[1]}`



			`def createScrobble(artists,title,time):`
			`i = getTrackID(artists,title)`
			`obj = (i,time,False)`
			`SCROBBLES.append(obj)`

			`def readScrobble(artists,title,time):`
			`i = getTrackID(artists,title)`
			`obj = (i,time,True)`
			`SCROBBLES.append(obj)`

			`def getArtistID(name):`

			`obj = name`
			`try:`
			`i = ARTISTS.index(obj)`
			`except:`
			`i = len(ARTISTS)`
			`ARTISTS.append(obj)`
			`return i`

			`def getTrackID(artists,title):`
			`artistset = set()`
			`for a in artists:`
			`artistset.add(getArtistID(name=a))`
			`obj = (frozenset(artistset),title)`

			`try:`
			`i = TRACKS.index(obj)`
			`except:`
			`i = len(TRACKS)`
			`TRACKS.append(obj)`
			`return i`
Initial commit 2018-11-24 18:29:24 +03:00

			`@route("/scrobbles")`
			`def get_scrobbles():`
			`keys = request.query`
			`r = db_query(artist=keys.get("artist"))`

Cleanup and some fixing 2018-11-25 21:31:03 +03:00			`return {"list":r} ##json can't be a list apparently???`
Initial commit 2018-11-24 18:29:24 +03:00
			`@route("/tracks")`
			`def get_tracks():`
			`artist = request.query.get("artist")`

Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`# Option 1`
			`ls = [getTrackObject(t) for t in TRACKS if (artist in t[0]) or (artist==None)]`

			`# Option 2 is a bit more elegant but much slower`
			`#tracklist = [getTrackObject(t) for t in TRACKS]`
			`#ls = [t for t in tracklist if (artist in t["artists"]) or (artist==None)]`

Expanding the code 2018-11-25 16:49:53 +03:00			`return {"list":ls}`

			`@route("/artists")`
			`def get_artists():`
Cleanup and some fixing 2018-11-25 21:31:03 +03:00
Expanding the code 2018-11-25 16:49:53 +03:00			`return {"list":ARTISTS}`

			`@route("/charts")`
			`def get_charts():`
			`since = request.query.get("since")`
			`to = request.query.get("to")`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00
			`#better do something here to sum up the totals on db level (before converting to dicts)`

			`#results = db_query(since=since,to=to)`
			`#return {"list":results}`
Added basic scrobbling function 2018-11-26 18:21:07 +03:00
			`@route("/newscrobble")`
			`def post_scrobble():`
			`keys = request.query`
			`artists = keys.get("artist")`
			`title = keys.get("title")`
			`(artists,title) = cleanup.fullclean(artists,title)`
			`time = int(datetime.datetime.now(tz=datetime.timezone.utc).timestamp())`

Added basic scrobbler for Plex Web on Chromium/Vivaldi 2018-11-27 18:08:14 +03:00			`## this is necessary for localhost testing`
			`response.set_header("Access-Control-Allow-Origin","*")`

Added basic scrobbling function 2018-11-26 18:21:07 +03:00			`createScrobble(artists,title,time)`
Added basic scrobbler for Plex Web on Chromium/Vivaldi 2018-11-27 18:08:14 +03:00
			`return ""`

			`@route("/flush")`
			`def abouttoshutdown():`
			`flush()`
			`print("Database saved to disk.")`
			`#sys.exit()`
Initial commit 2018-11-24 18:29:24 +03:00
			`# Starts the server`
			`def runserver(DATABASE_PORT):`

Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`#reload()`
			`#buildh()`
			`build_db()`
Initial commit 2018-11-24 18:29:24 +03:00
			`run(host='0.0.0.0', port=DATABASE_PORT, server='waitress')`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00

			`def build_db():`
Initial commit 2018-11-24 18:29:24 +03:00
Cleanup and some fixing 2018-11-25 21:31:03 +03:00			`global SCROBBLES`

			`SCROBBLESNEW = []`
			`for t in SCROBBLES:`
			`if not t[2]:`
			`SCROBBLESNEW.append(t)`

			`SCROBBLES = SCROBBLESNEW`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00
			`for f in os.listdir("logs/"):`

Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`if not (".tsv" in f):`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`continue`

			`logfile = open("logs/" + f)`
			`for l in logfile:`

			`l = l.replace("\n","")`
Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`data = l.split("\t")`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00
			`## saving album in the scrobbles is supported, but for now we don't use it. It shouldn't be a defining part of the track (same song from Album or EP), but derived information`
Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`artists = data[1].split("␟")`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`#album = data[3]`
			`title = data[2]`
			`time = int(data[0])`

			`readScrobble(artists,title,time)`


Initial commit 2018-11-24 18:29:24 +03:00
			`# builds database of artists and tracks`
			`# UNUSED as it is very resource-heavy, use buildh() instead`
			`def build():`
			`global ARTISTS`
			`global TRACKS`

			`artistlist = []`
			`tracklist = []`
			`for t in DATABASE:`
			`for a in t["artists"]:`
			`if a in artistlist:`
			`continue`
			`artistlist.append(a)`

			`# first check if the title exists at all to quickly rule out most titles`
			`if (t["title"] in [tr["title"] for tr in tracklist]):`
			`#only it same title actually exists do we need to check if the song is the same`


			`if not (set(t["artists"]) in [set(tr["artists"]) for tr in tracklist if tr["title"] == t["title"]]): #wut`
			`tracklist.append({"artists":t["artists"],"title":t["title"]})`

			`### ALRIGHT`
			`#foundexisting = False`
			`#for track in [tr for tr in tracklist if tr["title"] == t["title"]]: #wtf did I just write`
			`# #print("Check duplicate: " + str(track) + " AND " + str(t))`
			`# if (set(track["artists"]) == set(t["artists"])):`
			`# foundexisting = True`
			`# #print("MATCH!")`
			`# break`
			`# #else:`
			`# #print("NO MATCH!")`
Expanding the code 2018-11-25 16:49:53 +03:00			`#`
Initial commit 2018-11-24 18:29:24 +03:00			`#if not foundexisting:`
			`# tracklist.append({"artists":t["artists"],"title":t["title"]})`
			`else:`
			`tracklist.append({"artists":t["artists"],"title":t["title"]})`


			`ARTISTS = artistlist`
			`TRACKS = tracklist`


			`# builds database of artists and tracks`
			`# uses better data types to quickly find all unique tracks`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`# now also UNUSED since we build everything in one step with build_db()`
Initial commit 2018-11-24 18:29:24 +03:00			`def buildh():`
			`global ARTISTS`
			`global TRACKS`

			`artistset = set()`
			`trackset = set()`
			`for t in DATABASE:`
			`for a in t["artists"]:`
Expanding the code 2018-11-25 16:49:53 +03:00			`#if a not in artistset:`
			`artistset.add(a)`
Initial commit 2018-11-24 18:29:24 +03:00
			`# we list the tracks as tupels of frozenset(artists) and track`
			`# this way they're hashable and easily comparable, but we need to change them back after we have the list`
Expanding the code 2018-11-25 16:49:53 +03:00			`#if ((frozenset(t["artists"]),t["title"])) not in trackset:`
			`trackset.add((frozenset(t["artists"]),t["title"]))`
Initial commit 2018-11-24 18:29:24 +03:00
			`print("Done, now converting back!")`

			`ARTISTS = list(artistset)`
Expanding the code 2018-11-25 16:49:53 +03:00			`#TRACKS = [{"artists":list(a[0]),"title":a[1]} for a in trackset]`
			`#actually lets only convert this once we need it, kinda makes sense to store it in the tuple frozenset form`
			`TRACKS = list(trackset)`

Initial commit 2018-11-24 18:29:24 +03:00
			`# Rebuilds the database from disk, keeps cached entries`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`# unused, this is now done in build_db()`
Initial commit 2018-11-24 18:29:24 +03:00			`def reload():`
			`newdb = [t for t in DATABASE if not t["saved"]]`

			`for f in os.listdir("logs/"):`
			`#print(f)`

			`if not (".csv" in f):`
			`continue`

			`logfile = open("logs/" + f)`
			`for l in logfile:`

			`l = l.replace("\n","")`
			`data = l.split(",")`
			`#print(l)`

Expanding the code 2018-11-25 16:49:53 +03:00
			`## saving album in the scrobbles is supported, but for now we don't use it. It shouldn't be a defining part of the track (same song from Album or EP), but derived information`
Initial commit 2018-11-24 18:29:24 +03:00			`artists = data[1].split("/")`
			`#album = data[3]`
			`title = data[2]`
			`time = int(data[0])`

			`DATABASE.append({"artists":artists,"title":title,"time":time,"saved":True})`

			`# Saves all cached entries to disk`
			`def flush():`
Cleanup and some fixing 2018-11-25 21:31:03 +03:00			`for s in SCROBBLES:`
			`if not s[2]:`

			`t = getScrobbleObject(s)`

Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`artistss = "␟".join(t["artists"])`
Initial commit 2018-11-24 18:29:24 +03:00			`timestamp = datetime.date.fromtimestamp(t["time"])`

Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`entry = "\t".join([str(t["time"]),artistss,t["title"]])`
Initial commit 2018-11-24 18:29:24 +03:00
Switched to better delimiters (tab and ASCII31) 2018-11-26 14:55:17 +03:00			`monthfile = open("logs/" + str(timestamp.year) + "_" + str(timestamp.month) + ".tsv","a")`
Initial commit 2018-11-24 18:29:24 +03:00			`monthfile.write(entry)`
			`monthfile.write("\n")`
			`monthfile.close()`

Cleanup and some fixing 2018-11-25 21:31:03 +03:00			`t[2] = True`
Initial commit 2018-11-24 18:29:24 +03:00

			`# Queries the database`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`def db_query(artist=None,track=None,since=0,to=9999999999):`
Initial commit 2018-11-24 18:29:24 +03:00			`if isinstance(since, str):`
			`sdate = [int(x) for x in since.split("/")]`
			`date = [1970,1,1,0,0]`
			`date[:len(sdate)] = sdate`
			`since = int(datetime.datetime(date[0],date[1],date[2],date[3],date[4],tzinfo=datetime.timezone.utc).timestamp())`
			`if isinstance(to, str):`
			`sdate = [int(x) for x in to.split("/")]`
			`date = [1970,1,1,0,0]`
			`date[:len(sdate)] = sdate`
			`to = int(datetime.datetime(date[0],date[1],date[2],date[3],date[4],tzinfo=datetime.timezone.utc).timestamp())`
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00
			`# this is not meant as a search function. we can query the db with a string, but it only works if it matches exactly (and title string simply picks the first track with that name)`
			`if isinstance(artist, str):`
			`artist = ARTISTS.index(artist)`
			`if isinstance(track, str):`
			`track = TRACKS.index(track)`

			`return [getScrobbleObject(s) for s in SCROBBLES if (s[0] == track or track==None) and (artist in TRACKS[s[0]][0] or artist==None) and (since < s[1] < to)]`
			`# pointless to check for artist when track is checked because every track has a fixed set of artists, but it's more elegant this way`

Initial commit 2018-11-24 18:29:24 +03:00
Major restructuring of the database from dicts to tuples 2018-11-25 20:17:14 +03:00			`#thingsweneed = ["artists","title","time"]`
			`#return [{key:t[key] for key in thingsweneed} for t in DATABASE if (artist in t["artists"] or artist==None) and (t["title"]==title or title==None) and (since < t["time"] < to)]`
Initial commit 2018-11-24 18:29:24 +03:00
			`# Search for strings`
			`def db_search(query,type=None):`
			`if type=="ARTIST":`
			`results = []`
			`for a in ARTISTS:`
			`if query.lower() in a.lower():`
			`results.append(a)`

			`if type=="TRACK":`
			`results = []`
			`for t in TRACKS:`
			`if query.lower() in t[1].lower():`
			`results.append(t)`

			`return results`