mirror of
https://github.com/ae-utbm/sith.git
synced 2024-11-16 03:03:21 +00:00
379 lines
13 KiB
Python
379 lines
13 KiB
Python
|
# -*- coding:utf-8 -*
|
||
|
#
|
||
|
# Copyright 2023
|
||
|
# - Skia <skia@hya.sk>
|
||
|
#
|
||
|
# Ce fichier fait partie du site de l'Association des Étudiants de l'UTBM,
|
||
|
# http://ae.utbm.fr.
|
||
|
#
|
||
|
# This program is free software; you can redistribute it and/or modify it under
|
||
|
# the terms of the GNU General Public License a published by the Free Software
|
||
|
# Foundation; either version 3 of the License, or (at your option) any later
|
||
|
# version.
|
||
|
#
|
||
|
# This program is distributed in the hope that it will be useful, but WITHOUT
|
||
|
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
||
|
# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
|
||
|
# details.
|
||
|
#
|
||
|
# You should have received a copy of the GNU General Public License along with
|
||
|
# this program; if not, write to the Free Sofware Foundation, Inc., 59 Temple
|
||
|
# Place - Suite 330, Boston, MA 02111-1307, USA.
|
||
|
#
|
||
|
#
|
||
|
|
||
|
import math
|
||
|
import logging
|
||
|
|
||
|
from typing import Tuple
|
||
|
from django.db import models
|
||
|
from django.db.models import Q, Case, F, Value, When, Count
|
||
|
from django.db.models.functions import Concat
|
||
|
from django.utils import timezone
|
||
|
from django.utils.translation import gettext_lazy as _
|
||
|
from typing import List, TypedDict
|
||
|
|
||
|
from core.models import User
|
||
|
from club.models import Club
|
||
|
from sas.models import Picture
|
||
|
|
||
|
|
||
|
class GalaxyStar(models.Model):
|
||
|
"""
|
||
|
This class defines a star (vertex -> user) in the galaxy graph, storing a reference to its owner citizen, and being
|
||
|
referenced by GalaxyLane.
|
||
|
|
||
|
It also stores the individual mass of this star, used to push it towards the center of the galaxy.
|
||
|
"""
|
||
|
|
||
|
owner = models.OneToOneField(
|
||
|
User,
|
||
|
verbose_name=_("star owner"),
|
||
|
related_name="galaxy_user",
|
||
|
on_delete=models.CASCADE,
|
||
|
)
|
||
|
mass = models.PositiveIntegerField(
|
||
|
_("star mass"),
|
||
|
default=0,
|
||
|
)
|
||
|
|
||
|
def __str__(self):
|
||
|
return str(self.owner)
|
||
|
|
||
|
|
||
|
class GalaxyLane(models.Model):
|
||
|
"""
|
||
|
This class defines a lane (edge -> link between galaxy citizen) in the galaxy map, storing a reference to both its
|
||
|
ends and the distance it covers.
|
||
|
Score details between citizen owning the stars is also stored here.
|
||
|
"""
|
||
|
|
||
|
star1 = models.ForeignKey(
|
||
|
GalaxyStar,
|
||
|
verbose_name=_("galaxy star 1"),
|
||
|
related_name="lanes1",
|
||
|
on_delete=models.CASCADE,
|
||
|
)
|
||
|
star2 = models.ForeignKey(
|
||
|
GalaxyStar,
|
||
|
verbose_name=_("galaxy star 2"),
|
||
|
related_name="lanes2",
|
||
|
on_delete=models.CASCADE,
|
||
|
)
|
||
|
distance = models.PositiveIntegerField(
|
||
|
_("distance"),
|
||
|
default=0,
|
||
|
help_text=_("Distance separating star1 and star2"),
|
||
|
)
|
||
|
family = models.PositiveIntegerField(
|
||
|
_("family score"),
|
||
|
default=0,
|
||
|
)
|
||
|
pictures = models.PositiveIntegerField(
|
||
|
_("pictures score"),
|
||
|
default=0,
|
||
|
)
|
||
|
clubs = models.PositiveIntegerField(
|
||
|
_("clubs score"),
|
||
|
default=0,
|
||
|
)
|
||
|
|
||
|
|
||
|
class StarDict(TypedDict):
|
||
|
id: int
|
||
|
name: str
|
||
|
mass: int
|
||
|
|
||
|
|
||
|
class GalaxyDict(TypedDict):
|
||
|
nodes: List[StarDict]
|
||
|
links: List
|
||
|
|
||
|
|
||
|
class Galaxy(models.Model):
|
||
|
logger = logging.getLogger("main")
|
||
|
|
||
|
GALAXY_SCALE_FACTOR = 2_000
|
||
|
FAMILY_LINK_POINTS = 366 # Equivalent to a leap year together in a club, because.
|
||
|
PICTURE_POINTS = 2 # Equivalent to two days as random members of a club.
|
||
|
CLUBS_POINTS = 1 # One day together as random members in a club is one point.
|
||
|
|
||
|
state = models.JSONField("current state")
|
||
|
|
||
|
@staticmethod
|
||
|
def make_state() -> None:
|
||
|
"""
|
||
|
Compute JSON structure to send to 3d-force-graph: https://github.com/vasturiano/3d-force-graph/
|
||
|
"""
|
||
|
without_nickname = Concat(
|
||
|
F("owner__first_name"), Value(" "), F("owner__last_name")
|
||
|
)
|
||
|
with_nickname = Concat(
|
||
|
F("owner__first_name"),
|
||
|
Value(" "),
|
||
|
F("owner__last_name"),
|
||
|
Value(" ("),
|
||
|
F("owner__nick_name"),
|
||
|
Value(")"),
|
||
|
)
|
||
|
stars = GalaxyStar.objects.annotate(
|
||
|
owner_name=Case(
|
||
|
When(owner__nick_name=None, then=without_nickname),
|
||
|
default=with_nickname,
|
||
|
)
|
||
|
)
|
||
|
lanes = GalaxyLane.objects.annotate(
|
||
|
star1_owner=F("star1__owner__id"),
|
||
|
star2_owner=F("star2__owner__id"),
|
||
|
)
|
||
|
json = GalaxyDict(
|
||
|
nodes=[
|
||
|
StarDict(id=star.owner_id, name=star.owner_name, mass=star.mass)
|
||
|
for star in stars
|
||
|
],
|
||
|
links=[],
|
||
|
)
|
||
|
# Make bidirectional links
|
||
|
# TODO: see if this impacts performance with a big graph
|
||
|
for path in lanes:
|
||
|
json["links"].append(
|
||
|
{
|
||
|
"source": path.star1_owner,
|
||
|
"target": path.star2_owner,
|
||
|
"value": path.distance,
|
||
|
}
|
||
|
)
|
||
|
json["links"].append(
|
||
|
{
|
||
|
"source": path.star2_owner,
|
||
|
"target": path.star1_owner,
|
||
|
"value": path.distance,
|
||
|
}
|
||
|
)
|
||
|
Galaxy.objects.all().delete()
|
||
|
Galaxy(state=json).save()
|
||
|
|
||
|
###################
|
||
|
# User self score #
|
||
|
###################
|
||
|
|
||
|
@classmethod
|
||
|
def compute_user_score(cls, user) -> int:
|
||
|
"""
|
||
|
This compute an individual score for each citizen. It will later be used by the graph algorithm to push
|
||
|
higher scores towards the center of the galaxy.
|
||
|
|
||
|
Idea: This could be added to the computation:
|
||
|
- Forum posts
|
||
|
- Picture count
|
||
|
- Counter consumption
|
||
|
- Barman time
|
||
|
- ...
|
||
|
"""
|
||
|
user_score = 1
|
||
|
user_score += cls.query_user_score(user)
|
||
|
|
||
|
# TODO:
|
||
|
# Scale that value with some magic number to accommodate to typical data
|
||
|
# Really active galaxy citizen after 5 years typically have a score of about XXX
|
||
|
# Citizen that were seen regularly without taking much part in organizations typically have a score of about XXX
|
||
|
# Citizen that only went to a few events typically score about XXX
|
||
|
user_score = int(math.log2(user_score))
|
||
|
|
||
|
return user_score
|
||
|
|
||
|
@classmethod
|
||
|
def query_user_score(cls, user) -> int:
|
||
|
score_query = (
|
||
|
User.objects.filter(id=user.id)
|
||
|
.annotate(
|
||
|
godchildren_count=Count("godchildren", distinct=True)
|
||
|
* cls.FAMILY_LINK_POINTS,
|
||
|
godfathers_count=Count("godfathers", distinct=True)
|
||
|
* cls.FAMILY_LINK_POINTS,
|
||
|
pictures_score=Count("pictures", distinct=True) * cls.PICTURE_POINTS,
|
||
|
clubs_score=Count("memberships", distinct=True) * cls.CLUBS_POINTS,
|
||
|
)
|
||
|
.aggregate(
|
||
|
score=models.Sum(
|
||
|
F("godchildren_count")
|
||
|
+ F("godfathers_count")
|
||
|
+ F("pictures_score")
|
||
|
+ F("clubs_score")
|
||
|
)
|
||
|
)
|
||
|
)
|
||
|
return score_query.get("score")
|
||
|
|
||
|
####################
|
||
|
# Inter-user score #
|
||
|
####################
|
||
|
|
||
|
@classmethod
|
||
|
def compute_users_score(cls, user1, user2) -> Tuple[int, int, int, int]:
|
||
|
family = cls.compute_users_family_score(user1, user2)
|
||
|
pictures = cls.compute_users_pictures_score(user1, user2)
|
||
|
clubs = cls.compute_users_clubs_score(user1, user2)
|
||
|
score = family + pictures + clubs
|
||
|
return score, family, pictures, clubs
|
||
|
|
||
|
@classmethod
|
||
|
def compute_users_family_score(cls, user1, user2) -> int:
|
||
|
link_count = User.objects.filter(
|
||
|
Q(id=user1.id, godfathers=user2) | Q(id=user2.id, godfathers=user1)
|
||
|
).count()
|
||
|
if link_count:
|
||
|
cls.logger.debug(
|
||
|
f"\t\t- '{user1}' and '{user2}' have {link_count} direct family link"
|
||
|
)
|
||
|
return link_count * cls.FAMILY_LINK_POINTS
|
||
|
|
||
|
@classmethod
|
||
|
def compute_users_pictures_score(cls, user1, user2) -> int:
|
||
|
picture_count = (
|
||
|
Picture.objects.filter(people__user__in=(user1,))
|
||
|
.filter(people__user__in=(user2,))
|
||
|
.count()
|
||
|
)
|
||
|
if picture_count:
|
||
|
cls.logger.debug(
|
||
|
f"\t\t- '{user1}' was pictured with '{user2}' {picture_count} times"
|
||
|
)
|
||
|
return picture_count * cls.PICTURE_POINTS
|
||
|
|
||
|
@classmethod
|
||
|
def compute_users_clubs_score(cls, user1, user2) -> int:
|
||
|
common_clubs = Club.objects.filter(members__in=user1.memberships.all()).filter(
|
||
|
members__in=user2.memberships.all()
|
||
|
)
|
||
|
user1_memberships = user1.memberships.filter(club__in=common_clubs)
|
||
|
user2_memberships = user2.memberships.filter(club__in=common_clubs)
|
||
|
|
||
|
score = 0
|
||
|
for user1_membership in user1_memberships:
|
||
|
if user1_membership.end_date is None:
|
||
|
user1_membership.end_date = timezone.now().date()
|
||
|
query = Q( # start2 <= start1 <= end2
|
||
|
start_date__lte=user1_membership.start_date,
|
||
|
end_date__gte=user1_membership.start_date,
|
||
|
)
|
||
|
query |= Q( # start2 <= start1 <= now
|
||
|
start_date__lte=user1_membership.start_date, end_date=None
|
||
|
)
|
||
|
query |= Q( # start1 <= start2 <= end2
|
||
|
start_date__gte=user1_membership.start_date,
|
||
|
start_date__lte=user1_membership.end_date,
|
||
|
)
|
||
|
for user2_membership in user2_memberships.filter(
|
||
|
query, club=user1_membership.club
|
||
|
):
|
||
|
if user2_membership.end_date is None:
|
||
|
user2_membership.end_date = timezone.now().date()
|
||
|
latest_start = max(
|
||
|
user1_membership.start_date, user2_membership.start_date
|
||
|
)
|
||
|
earliest_end = min(user1_membership.end_date, user2_membership.end_date)
|
||
|
cls.logger.debug(
|
||
|
"\t\t- '%s' was with '%s' in %s starting on %s until %s (%s days)"
|
||
|
% (
|
||
|
user1,
|
||
|
user2,
|
||
|
user2_membership.club,
|
||
|
latest_start,
|
||
|
earliest_end,
|
||
|
(earliest_end - latest_start).days,
|
||
|
)
|
||
|
)
|
||
|
score += cls.CLUBS_POINTS * (earliest_end - latest_start).days
|
||
|
return score
|
||
|
|
||
|
###################
|
||
|
# Rule the galaxy #
|
||
|
###################
|
||
|
|
||
|
@classmethod
|
||
|
def rule(cls) -> None:
|
||
|
GalaxyStar.objects.all().delete()
|
||
|
# The following is a no-op thanks to cascading, but in case that changes in the future, better keep it anyway.
|
||
|
GalaxyLane.objects.all().delete()
|
||
|
rulable_users = (
|
||
|
User.objects.filter(subscriptions__isnull=False)
|
||
|
.filter(
|
||
|
Q(godchildren__isnull=False)
|
||
|
| Q(godfathers__isnull=False)
|
||
|
| Q(pictures__isnull=False)
|
||
|
| Q(memberships__isnull=False)
|
||
|
)
|
||
|
.distinct()
|
||
|
)
|
||
|
# force fetch of the whole query to make sure there won't
|
||
|
# be any more db hits
|
||
|
# this is memory expensive but prevents a lot of db hits, therefore
|
||
|
# is far more time efficient
|
||
|
rulable_users = list(rulable_users)
|
||
|
while len(rulable_users) > 0:
|
||
|
user1 = rulable_users.pop()
|
||
|
for user2 in rulable_users:
|
||
|
cls.logger.debug("")
|
||
|
cls.logger.debug(f"\t> Ruling '{user1}' against '{user2}'")
|
||
|
star1, _ = GalaxyStar.objects.get_or_create(owner=user1)
|
||
|
star2, _ = GalaxyStar.objects.get_or_create(owner=user2)
|
||
|
if star1.mass == 0:
|
||
|
star1.mass = cls.compute_user_score(user1)
|
||
|
star1.save()
|
||
|
if star2.mass == 0:
|
||
|
star2.mass = cls.compute_user_score(user2)
|
||
|
star2.save()
|
||
|
users_score, family, pictures, clubs = cls.compute_users_score(
|
||
|
user1, user2
|
||
|
)
|
||
|
if users_score > 0:
|
||
|
GalaxyLane(
|
||
|
star1=star1,
|
||
|
star2=star2,
|
||
|
distance=cls.scale_distance(users_score),
|
||
|
family=family,
|
||
|
pictures=pictures,
|
||
|
clubs=clubs,
|
||
|
).save()
|
||
|
|
||
|
@classmethod
|
||
|
def scale_distance(cls, value) -> int:
|
||
|
# TODO: this will need adjustements with the real, typical data on Taiste
|
||
|
|
||
|
cls.logger.debug(f"\t\t> Score: {value}")
|
||
|
# Invert score to draw close users together
|
||
|
value = 1 / value # Cannot be 0
|
||
|
value += 2 # We use log2 just below and need to stay above 1
|
||
|
value = ( # Let's get something in the range ]0; log2(3)-1≈0.58[ that we can multiply later
|
||
|
math.log2(value) - 1
|
||
|
)
|
||
|
value *= ( # Scale that value with a magic number to accommodate to typical data
|
||
|
# Really close galaxy citizen after 5 years typically have a score of about XXX
|
||
|
# Citizen that were in the same year without being really friends typically have a score of about XXX
|
||
|
# Citizen that have met once or twice only have a couple of pictures together typically score about XXX
|
||
|
cls.GALAXY_SCALE_FACTOR
|
||
|
)
|
||
|
cls.logger.debug(f"\t\t> Scaled distance: {value}")
|
||
|
return int(value)
|