1
0
mirror of https://github.com/krateng/maloja.git synced 2023-08-10 21:12:55 +03:00
maloja/database.py

293 lines
7.2 KiB
Python
Raw Normal View History

2018-11-30 15:39:12 +03:00
from bottle import route, get, post, run, template, static_file, request, response, FormsDict
2018-11-24 18:29:24 +03:00
from importlib.machinery import SourceFileLoader
2018-11-27 21:05:50 +03:00
import urllib
2018-11-24 18:29:24 +03:00
import waitress
import os
import datetime
2018-11-28 19:45:52 +03:00
from cleanup import *
2018-11-30 17:44:30 +03:00
from utilities import *
import sys
2018-11-24 18:29:24 +03:00
# In-memory database state.
SCROBBLES = []	# Format: tuple(track_ref,timestamp,saved)
ARTISTS = []	# Format: artist
TRACKS = []	# Format: tuple(frozenset(artist_ref,...),title)
timestamps = set()	# every scrobble timestamp currently in use (kept unique)

c = CleanerAgent()

clients = []	# [key, machine name] pairs loaded from the clients TSV

lastsync = 0	# unix timestamp of the last write-back to disk
2018-11-30 17:44:30 +03:00
### symmetric keys are fine for now since we hopefully use HTTPS
def loadAPIkeys():
	"""Load client API keys from the TSV file, creating it first if absent."""
	global clients
	keyfile = "clients/authenticated_machines.tsv"
	createTSV(keyfile)
	clients = parseTSV(keyfile,"string","string")
2018-11-30 17:44:30 +03:00
def checkAPIkey(k):
	"""Return True if k matches any registered client API key."""
	return any(key == k for [key, _machine] in clients)
def getScrobbleObject(o):
	"""Convert an internal scrobble tuple into a serializable dict."""
	track = getTrackObject(TRACKS[o[0]])
	return {
		"artists": track["artists"],
		"title": track["title"],
		"time": o[1],
	}
def getArtistObject(o):
	"""Artists are stored as plain strings, so expose them unchanged."""
	return o
def getTrackObject(o):
	"""Convert an internal track tuple into a serializable dict."""
	(artist_refs, title) = o
	artists = [getArtistObject(ARTISTS[ref]) for ref in artist_refs]
	return {"artists": artists, "title": title}
def createScrobble(artists,title,time):
	"""Register a brand-new (not-yet-saved) scrobble.

	Timestamps double as unique scrobble ids, so collide-and-bump until
	this one is free.
	"""
	while time in timestamps:
		time += 1
	timestamps.add(time)
	track_id = getTrackID(artists,title)
	SCROBBLES.append((track_id, time, False))
def readScrobble(artists,title,time):
	"""Register a scrobble read back from disk (already saved).

	Same timestamp-uniqueness bumping as createScrobble, but the entry is
	flagged as saved so sync() won't write it again.
	"""
	while time in timestamps:
		time += 1
	timestamps.add(time)
	track_id = getTrackID(artists,title)
	SCROBBLES.append((track_id, time, True))
def getArtistID(name):
	"""Return the index of name in ARTISTS, appending it first if unknown.

	Fix: only ValueError (name not found) triggers insertion; the original
	bare except also swallowed unrelated errors.
	"""
	try:
		return ARTISTS.index(name)
	except ValueError:
		ARTISTS.append(name)
		return len(ARTISTS) - 1
def getTrackID(artists,title):
	"""Return the index of (artists,title) in TRACKS, appending it first if unknown.

	Artist ids are stored as a frozenset so artist order never distinguishes
	tracks. Fix: only ValueError (track not found) triggers insertion,
	instead of the original bare except.
	"""
	artist_ids = frozenset(getArtistID(name=a) for a in artists)
	track = (artist_ids, title)
	try:
		return TRACKS.index(track)
	except ValueError:
		TRACKS.append(track)
		return len(TRACKS) - 1
2018-11-24 18:29:24 +03:00
@route("/scrobbles")
def get_scrobbles():
keys = request.query
2018-11-27 18:21:33 +03:00
r = db_query(artist=keys.get("artist"),track=keys.get("track"),since=keys.get("since"),to=keys.get("to"))
2018-11-24 18:29:24 +03:00
2018-11-25 21:31:03 +03:00
return {"list":r} ##json can't be a list apparently???
2018-11-24 18:29:24 +03:00
@route("/tracks")
def get_tracks():
artist = request.query.get("artist")
2018-11-30 15:39:12 +03:00
if artist is not None:
artistid = ARTISTS.index(artist)
2018-11-28 20:44:33 +03:00
# Option 1
2018-11-28 20:44:33 +03:00
ls = [getTrackObject(t) for t in TRACKS if (artistid in t[0]) or (artistid==None)]
# Option 2 is a bit more elegant but much slower
#tracklist = [getTrackObject(t) for t in TRACKS]
#ls = [t for t in tracklist if (artist in t["artists"]) or (artist==None)]
2018-11-25 16:49:53 +03:00
return {"list":ls}
@route("/artists")
def get_artists():
2018-11-25 21:31:03 +03:00
2018-11-25 16:49:53 +03:00
return {"list":ARTISTS}
@route("/charts")
def get_charts():
since = request.query.get("since")
to = request.query.get("to")
#better do something here to sum up the totals on db level (before converting to dicts)
#results = db_query(since=since,to=to)
#return {"list":results}
2018-11-26 18:21:07 +03:00
2018-11-30 15:39:12 +03:00
@get("/newscrobble")
def pseudo_post_scrobble():
2018-11-27 21:05:50 +03:00
keys = FormsDict.decode(request.query) # The Dal★Shabet handler
2018-11-26 18:21:07 +03:00
artists = keys.get("artist")
title = keys.get("title")
2018-11-28 19:45:52 +03:00
try:
time = int(keys.get("time"))
except:
2018-11-28 17:33:30 +03:00
time = int(datetime.datetime.now(tz=datetime.timezone.utc).timestamp())
2018-11-28 19:45:52 +03:00
(artists,title) = c.fullclean(artists,title)
## this is necessary for localhost testing
response.set_header("Access-Control-Allow-Origin","*")
2018-11-26 18:21:07 +03:00
createScrobble(artists,title,time)
2018-11-28 15:02:43 +03:00
if (time - lastsync) > 3600:
sync()
return ""
2018-11-30 15:39:12 +03:00
@post("/newscrobble")
def post_scrobble():
keys = FormsDict.decode(request.forms) # The Dal★Shabet handler
artists = keys.get("artist")
title = keys.get("title")
2018-11-30 17:44:30 +03:00
apikey = keys.get("key")
if not (checkAPIkey(apikey)):
response.status = 403
return ""
2018-11-30 15:39:12 +03:00
try:
time = int(keys.get("time"))
except:
time = int(datetime.datetime.now(tz=datetime.timezone.utc).timestamp())
(artists,title) = c.fullclean(artists,title)
## this is necessary for localhost testing
response.set_header("Access-Control-Allow-Origin","*")
createScrobble(artists,title,time)
if (time - lastsync) > 3600:
sync()
return ""
2018-11-28 15:02:43 +03:00
@route("/sync")
def abouttoshutdown():
2018-11-28 15:02:43 +03:00
sync()
#sys.exit()
2018-11-24 18:29:24 +03:00
# Starts the server
def runserver(DATABASE_PORT):
	"""Build the in-memory db, load API keys, then serve via waitress."""
	global lastsync
	lastsync = int(datetime.datetime.now(tz=datetime.timezone.utc).timestamp())

	build_db()
	loadAPIkeys()

	run(host='0.0.0.0', port=DATABASE_PORT, server='waitress')
def build_db():
	"""Rebuild in-memory state from the TSV logs in logs/.

	Unsaved scrobbles are kept; previously-loaded (saved) ones are dropped
	and re-read from disk, so the log files stay the source of truth.
	"""
	global SCROBBLES
	SCROBBLES = [s for s in SCROBBLES if not s[2]]	# keep only unsaved entries
	for f in os.listdir("logs/"):
		if not (".tsv" in f):
			continue
		# fix: close each log file deterministically (the handle was leaked)
		with open("logs/" + f) as logfile:
			for l in logfile:
				data = l.replace("\n","").split("\t")
				## saving album in the scrobbles is supported, but for now we
				## don't use it. It shouldn't be a defining part of the track
				## (same song from Album or EP), but derived information
				# NOTE(review): the artist separator literal was garbled to ""
				# in this copy (str.split("") raises ValueError); "␟" (U+241F)
				# is the separator maloja uses in its TSV logs — confirm
				# against an actual log file and sync() below.
				artists = data[1].split("␟")
				#album = data[3]
				title = data[2]
				time = int(data[0])
				readScrobble(artists,title,time)
2018-11-24 18:29:24 +03:00
# Saves all cached entries to disk
def sync():
	"""Append every unsaved scrobble to its monthly TSV log, then mark it saved."""
	global lastsync
	for idx in range(len(SCROBBLES)):
		if SCROBBLES[idx][2]:
			continue	# already on disk
		t = getScrobbleObject(SCROBBLES[idx])
		# NOTE(review): the artist separator literal was garbled to "" in
		# this copy; "␟" (U+241F) is the separator maloja uses in its TSV
		# logs — confirm against build_db's split.
		artistss = "␟".join(t["artists"])
		timestamp = datetime.date.fromtimestamp(t["time"])
		entry = "\t".join([str(t["time"]),artistss,t["title"]])
		# fix: context manager flushes and closes the file even on error
		with open("logs/" + str(timestamp.year) + "_" + str(timestamp.month) + ".tsv","a") as monthfile:
			monthfile.write(entry)
			monthfile.write("\n")
		SCROBBLES[idx] = (SCROBBLES[idx][0],SCROBBLES[idx][1],True)

	lastsync = int(datetime.datetime.now(tz=datetime.timezone.utc).timestamp())
	print("Database saved to disk.")
2018-11-28 15:02:43 +03:00
2018-11-24 18:29:24 +03:00
# Queries the database
def db_query(artist=None,track=None,since=0,to=9999999999):
2018-11-24 18:29:24 +03:00
if isinstance(since, str):
sdate = [int(x) for x in since.split("/")]
date = [1970,1,1,0,0]
date[:len(sdate)] = sdate
since = int(datetime.datetime(date[0],date[1],date[2],date[3],date[4],tzinfo=datetime.timezone.utc).timestamp())
if isinstance(to, str):
sdate = [int(x) for x in to.split("/")]
date = [1970,1,1,0,0]
date[:len(sdate)] = sdate
to = int(datetime.datetime(date[0],date[1],date[2],date[3],date[4],tzinfo=datetime.timezone.utc).timestamp())
2018-11-27 18:21:33 +03:00
if (since==None):
since = 0
if (to==None):
to = 9999999999
# this is not meant as a search function. we *can* query the db with a string, but it only works if it matches exactly (and title string simply picks the first track with that name)
if isinstance(artist, str):
artist = ARTISTS.index(artist)
if isinstance(track, str):
track = TRACKS.index(track)
return [getScrobbleObject(s) for s in SCROBBLES if (s[0] == track or track==None) and (artist in TRACKS[s[0]][0] or artist==None) and (since < s[1] < to)]
# pointless to check for artist when track is checked because every track has a fixed set of artists, but it's more elegant this way
2018-11-24 18:29:24 +03:00
#thingsweneed = ["artists","title","time"]
#return [{key:t[key] for key in thingsweneed} for t in DATABASE if (artist in t["artists"] or artist==None) and (t["title"]==title or title==None) and (since < t["time"] < to)]
2018-11-24 18:29:24 +03:00
# Search for strings
def db_search(query,type=None):
	"""Case-insensitive substring search over artists or tracks.

	type is "ARTIST" or "TRACK"; any other value (including the default
	None) yields an empty list. Bug fix: that case previously raised
	UnboundLocalError because results was never initialized.
	"""
	results = []
	needle = query.lower()
	if type=="ARTIST":
		results = [a for a in ARTISTS if needle in a.lower()]
	elif type=="TRACK":
		results = [t for t in TRACKS if needle in t[1].lower()]
	return results