Changeset - 606acf3a4446
[Not reviewed]
default
0 1 0
Laman - 7 years ago 2018-05-05 12:51:28

fix: timeToPeak ukazuje skutečné roky, ne kalendářní
1 file changed with 1 insertions and 1 deletions:
0 comments (0 inline, 0 general)
queries.py
Show inline comments
 
@@ -110,117 +110,117 @@ def populationStrength(year1,year2,count
 
	print("\r",end="",file=sys.stderr)
 

	
 
	print("Počty aktivních hráčů v {0} s uvedeným a vyšším ratingem".format(country))
 
	print("rating\t"+"\t".join(str(y) for y in range(year1,year2)))
 
	for rating in sorted(res.keys()):
 
		print(rating,end="\t")
 
		print("\t".join(str(res[rating].get(y,0)) for y in range(year1,year2)))
 

	
 

	
 
def _populationAge(year,country):
 
	"""Rozdělení populace země v daném roce podle doby hraní (celých let od prvního turnaje). Uvažují se pouze aktivní hráči."""
 
	date1=yearStart(year)
 
	date2=yearStart(year+1)
 
	query="""
 
		select date(?)-min_datum-1 as playing_years,count(pin)
 
			from (
 
				select ppt1.pin,min(ppt1.datum) as min_datum
 
					from players_performance_tournaments as ppt1
 
						join players_performance_tournaments as ppt2 on ppt1.pin=ppt2.pin
 
					where ppt2.datum>=date(?) and ppt2.datum<date(?) and ppt2.p_country_code=?
 
					group by ppt2.pin
 
			)
 
			group by playing_years
 
	"""
 
	return cursor.execute(query,(date2,date1,date2,country))
 

	
 

	
 
def populationAge(year1,year2,country):
 
	res=dict()
 

	
 
	for year in range(year1,year2):
 
		records=_populationAge(year,country)
 
		for (age,playerCount) in records:
 
			if age not in res:
 
				res[age]=dict()
 
			res[age][year]=playerCount
 
		print("\r",year,end="",file=sys.stderr)
 
	print("\r",end="",file=sys.stderr)
 

	
 
	print("Počty aktivních hráčů v {0} hrajících tolik a více let".format(country))
 
	print("roky hraní\t"+"\t".join(str(y) for y in range(year1,year2)))
 
	for age in sorted(res.keys()):
 
		print(age,end="\t")
 
		print("\t".join(str(res[age].get(y,0)) for y in range(year1,year2)))
 

	
 

	
 
def _tournamentAttendance(year):
 
	"""Návštěvnosti turnajů za daný rok, dělené podle země konání."""
 
	date1=yearStart(year)
 
	date2=yearStart(year+1)
 
	query="""select country_code,sum(player_count) from tournaments where datum>=date(?) and datum<date(?) group by country_code"""
 

	
 
	return cursor.execute(query,(date1,date2))
 

	
 

	
 
def tournamentAttendance(year1,year2):
 
	res=dict()
 

	
 
	for year in range(year1,year2):
 
		records=_tournamentAttendance(year)
 
		for (country,attendance) in records:
 
			if country not in res:
 
				res[country]=dict()
 
			res[country][year]=attendance
 
		print("\r",year,end="",file=sys.stderr)
 
	print("\r",end="",file=sys.stderr)
 

	
 
	print("Návštěvnosti (počty hráčů) na turnajích podle let")
 
	print("kód země\t"+"\t".join(str(y) for y in range(year1,year2)))
 
	for country in sorted(res.keys()):
 
		print(country,end="\t")
 
		print("\t".join(str(res[country].get(y,0)) for y in range(year1,year2)))
 

	
 

	
 
def fetchByRating(strongerThan,country=""):
 
	"""Hráči, kteří dosáhli rating strongerThan nebo vyšší, nepovinně filtrovaní podle země, seřazení od nejlepšího dosaženého ratingu."""
 
	query="""
 
		select pin,name,max(rating_after) as max_rating
 
			from players_performance natural join players
 
			where rating_after>=? and (?='' or country_code=?)
 
			group by pin
 
			order by max_rating desc"""
 

	
 
	res=cursor.execute(query,(strongerThan,country,country))
 
	print("pin\tjméno\tmax rating")
 
	for rec in res:
 
		print("\t".join([str(x) for x in rec]))
 

	
 

	
 
def timeToPeak():
 
	"""Jakého hráči dosáhli maximálního ratingu a jak dlouho jim to trvalo.
 

	
 
	Uvažuje hráče začínající s ratingem<=600 a s vrcholem před 1.1.2017."""
 
	# join on pin, max_rating může duplikovat řádky, když měl hráč stejný max_rating vícekrát.
 
	# proto ten ošklivý vnější group by :-ú
 
	query="""
 
		select subq.pin,min(min_rating),min(max_rating),min(_min_datum) as min_datum,min(datum) as peak_datum,min(datum)-min(_min_datum) as time_to_peak
 
		select subq.pin,min(min_rating),min(max_rating),min(_min_datum) as min_datum,min(datum) as peak_datum,(julianday(min(datum))-julianday(min(_min_datum)))/365.25 as time_to_peak
 
			from players_performance_tournaments as ppt
 
				join (select pin,min(rating_before) as min_rating,max(rating_after) as max_rating,min(datum) as _min_datum from players_performance_tournaments group by pin having min_rating<=600) as subq on ppt.pin=subq.pin and ppt.rating_after=max_rating
 
			group by ppt.pin
 
			having peak_datum<date('2017-01-01')
 
	"""
 

	
 
	res=cursor.execute(query)
 
	print("pin\tmin rating\tmax rating\tprvní turnaj\tdosažení max ratingu\troky k max ratingu")
 
	for rec in res:
 
		print("\t".join([str(x) for x in rec]))
 

	
 

	
 
# playerYear("Kotowski Jaroslav",2017)
 
# timeRank(2017,"CZ")
 
# yearsByCountry(2001,2018)
 
# populationStrength(2001,2018,"RU")
 
# populationAge(2001,2018,"RU")
 
# tournamentAttendance(2001,2018)
 
# fetchByRating(2600,"CZ")
 
# timeToPeak()
0 comments (0 inline, 0 general)