bounties_api/analytics/management/commands/timeline_generator.py

from datetime import datetime, timedelta
from functools import reduce

import arrow
from django.core.management import BaseCommand
from django.db.models import Q, Sum

from analytics.models import BountiesTimeline
from std_bounties.constants import EXPIRED_STAGE, DEAD_STAGE, COMPLETED_STAGE, ACTIVE_STAGE, DRAFT_STAGE
from std_bounties.models import BountyState, Fulfillment


ALL_PLATFORM = 'all'
DEFAULT_PLATFORM = 'bounties-network'
DEFAULT_PLATFORM_QUERY = Q(bounty__platform=DEFAULT_PLATFORM) | Q(bounty__platform=None) | Q(bounty__platform='')


def diff_time(since, until):
    return until - since


def diff_days(last_update, now=datetime.utcnow()):
    return (diff_time(now, last_update)).days


def day_bounds(day):
    utc_day = arrow.get(day).to('utc')
    floor = utc_day.floor('day')
    ceil = utc_day.ceil('day')

    return floor.datetime, ceil.datetime


def week_bounds(day):
    utc_day = arrow.get(day).to('utc')
    floor = utc_day.floor('week')
    ceil = utc_day.ceil('week')

    return floor.datetime, ceil.datetime


def range_days(since, until):
    return arrow.Arrow.range('day', since, until)


def range_weeks(since, until):
    return arrow.Arrow.range('week', since, until)


def get_date(time_frame):
    return time_frame.last().change_date


def add_on(stage):
    return lambda current, next_value: current + \
        1 if next_value.bounty_stage == stage else current


def get_bounties_issued(time_frame):
    return time_frame.distinct('bounty').count()


def get_fulfillments_submitted(time_frame):
    return time_frame.count()


def get_fulfillments_accepted(time_frame):
    return time_frame.count()


def get_fulfillment_acceptance_rate(time_frame, accepted_date=datetime.now()):
    counter = time_frame.count()
    return time_frame.filter(
        accepted_date__lte=accepted_date).count() / counter if counter else 0


def get_bounty_fulfilled_rate(time_frame, bounties):
    counter = bounties.count()
    return time_frame.distinct('bounty').count() / \
        bounties.count() if counter else 0


def get_avg_fulfiller_acceptance_rate(
        time_frame, accepted_date=datetime.now()):
    fulfillers = [b['fulfiller']
                  for b in time_frame.values('fulfiller').distinct()]
    counter = 0
    accumulator = 0

    for fulfiller in fulfillers:
        fulfillments = time_frame.filter(fulfiller=fulfiller)
        accepted_fulfillments = fulfillments.filter(
            accepted=True, accepted_date__lte=accepted_date).count()
        accumulator += accepted_fulfillments / fulfillments.count()
        counter += 1

    return accumulator / counter if counter > 0 else 0


def get_total_amount_paid(time_frame, accepted_date=datetime.now()):
    fulfillers = [b['fulfiller']
                  for b in time_frame.values('fulfiller').distinct()]

    total = 0
    for fulfiller in fulfillers:
        fulfillments = time_frame.filter(fulfiller=fulfiller)
        accepted_fulfillments = fulfillments.filter(
            accepted=True, accepted_date__lte=accepted_date)
        sum_fulfillments = accepted_fulfillments.aggregate(Sum('usd_price')).get('usd_price__sum')
        total += sum_fulfillments if sum_fulfillments is not None else 0
    return total


def get_avg_fulfillment_amount(time_frame):
    completed_bounties = filter(
        lambda bounty: bounty.bounty_stage == COMPLETED_STAGE,
        time_frame)
    (total, count) = reduce(lambda prev, current: (
        prev[0] + current.bounty.usd_price, prev[1] + 1), completed_bounties, (0, 0))

    return total / count if count > 0 else 0


def get_total_fulfillment_amount(time_frame):
    completed_bounties = filter(
        lambda bounty: bounty.bounty_stage == COMPLETED_STAGE,
        time_frame)
    return reduce(
        lambda prev,
        current: prev +
        current.bounty.fulfillment_amount,
        completed_bounties,
        0)


def get_total_unique_issuers(time_frame):
    return time_frame.distinct('bounty').values('bounty__issuer_address').distinct().count()


def get_total_unique_fulfillers(time_frame):
    return time_frame.values('fulfiller').distinct().count()


def get_bounty_draft(time_frame):
    return reduce(add_on(DRAFT_STAGE), time_frame, 0)


def get_bounty_active(time_frame):
    return reduce(add_on(ACTIVE_STAGE), time_frame, 0)


def get_bounty_completed(time_frame):
    return reduce(add_on(COMPLETED_STAGE), time_frame, 0)


def get_bounty_expired(time_frame):
    return reduce(add_on(EXPIRED_STAGE), time_frame, 0)


def get_bounty_dead(time_frame):
    return reduce(add_on(DEAD_STAGE), time_frame, 0)


def build_stages(time_frame):
    """ Build the total for each bounty stage in a given time frame
    1. In a given time frame, are retrieved all distinct bounties
    2. Get the last stage for the bounty
    3. Increment the counter for the given stage
    Each position correspond in the stage array correspond to the stage in `constants.py`:
        DRAFT_STAGE = 0
        ACTIVE_STAGE = 1
        DEAD_STAGE = 2
        COMPLETED_STAGE = 3
        EXPIRED_STAGE = 4
    returns [total_drafts, total_active, total_dead, total_completed, total_expired], {bounty: [STAGES...]}
    **Each total correspond to the last stages of the bounties in the given time frame**
    """
    # TODO: Queries optimization
    unique_bounties = [b['bounty']
                       for b in time_frame.values('bounty').distinct()]

    stages = [0, 0, 0, 0, 0]
    bounty_stages = {}
    for bounty_id in unique_bounties:
        bounty_states = time_frame.filter(
            bounty=bounty_id).order_by(
            '-change_date',
            '-bounty_stage')
        bounty_stages[bounty_id] = map(lambda b: b.bounty_stage, bounty_states)
        current_stage = bounty_states.first().bounty_stage
        stages[current_stage] = stages[current_stage] + 1

    return stages, bounty_stages


def get_noise_bounties(bounties):
    noise_bounty_dead = sorted([DRAFT_STAGE, DEAD_STAGE])
    noise_bounty_draft = [DRAFT_STAGE]
    noise = []
    for (bounty, stages) in bounties.items():
        sorted_stages = sorted(stages)
        if sorted_stages == noise_bounty_dead or sorted_stages == noise_bounty_draft:
            noise = [bounty] + noise

    return noise


def generate_timeline(time_frame, platform=DEFAULT_PLATFORM):
    date = time_frame[1]
    bounty_state_platform = BountyState.objects
    fulfillment_platform = Fulfillment.objects

    if platform == DEFAULT_PLATFORM:
        bounty_state_platform = bounty_state_platform.select_related('bounty').filter(DEFAULT_PLATFORM_QUERY)
        fulfillment_platform = fulfillment_platform.select_related('bounty').filter(DEFAULT_PLATFORM_QUERY)
    elif platform and platform != ALL_PLATFORM:
        bounty_state_platform = bounty_state_platform.select_related('bounty').filter(
            bounty__platform=platform)
        fulfillment_platform = fulfillment_platform.select_related('bounty').filter(
            bounty__platform=platform)

    bounties_state_frame_day = bounty_state_platform.filter(
        change_date__range=time_frame, bounty_stage=DRAFT_STAGE)
    bounties_state_frame = bounty_state_platform.filter(
        change_date__lte=time_frame[1])
    fulfillment_accepted_frame = fulfillment_platform.filter(
        accepted_date__lte=time_frame[1])
    fulfillment_accepted_frame_day = fulfillment_platform.filter(
        accepted_date__range=time_frame)
    fulfillment_submitted_frame = fulfillment_platform.filter(
        fulfillment_created__lte=time_frame[1])
    fulfillment_submitted_frame_day = fulfillment_platform.filter(
        fulfillment_created__range=time_frame)

    stages, bounties = build_stages(bounties_state_frame)

    noise_bounties = get_noise_bounties(bounties)

    bounties_issued = get_bounties_issued(bounties_state_frame_day)
    bounties_issued_cum = get_bounties_issued(bounties_state_frame)

    fulfillments_submitted = get_fulfillments_submitted(
        fulfillment_submitted_frame_day)
    fulfillments_submitted_cum = get_fulfillments_submitted(
        fulfillment_submitted_frame)

    fulfillments_accepted = get_fulfillments_accepted(
        fulfillment_accepted_frame_day)
    fulfillments_accepted_cum = get_fulfillments_accepted(
        fulfillment_accepted_frame)

    # Also - a bounty can be active and still have an accepted fulfillment.
    # For example, a bounty may have a high balance to output multiple fulfillments.
    # So there is a slight error here.
    # Also, we probably want to not include bounties from the count that never were in an active state.
    # ie. a bounty that was in draft forever, or was killed after being in
    # draft.

    fulfillment_acceptance_rate = get_fulfillment_acceptance_rate(
        fulfillment_submitted_frame, date)

    bounty_fulfilled_rate = get_bounty_fulfilled_rate(
        fulfillment_submitted_frame,
        bounties_state_frame .distinct('bounty') .exclude(
            bounty__in=noise_bounties))

    avg_fulfiller_acceptance_rate = get_avg_fulfiller_acceptance_rate(
        fulfillment_submitted_frame, date)

    avg_fulfillment_amount = get_avg_fulfillment_amount(bounties_state_frame)
    total_fulfillment_amount = get_total_amount_paid(fulfillment_accepted_frame, date)

    total_unique_issuers = get_total_unique_issuers(bounties_state_frame_day)
    total_unique_issuers_cum = get_total_unique_issuers(bounties_state_frame)
    total_unique_fulfillers = get_total_unique_fulfillers(fulfillment_submitted_frame_day)
    total_unique_fulfillers_cum = get_total_unique_fulfillers(fulfillment_submitted_frame)

    bounty_frame = BountiesTimeline(
        date=time_frame[0],
        bounties_issued=bounties_issued,
        bounties_issued_cum=bounties_issued_cum,
        fulfillments_submitted_cum=fulfillments_submitted_cum,
        fulfillments_submitted=fulfillments_submitted,
        fulfillments_accepted_cum=fulfillments_accepted_cum,
        fulfillments_accepted=fulfillments_accepted,
        fulfillments_pending_acceptance=fulfillments_submitted_cum -
        fulfillments_accepted_cum,
        fulfillment_acceptance_rate=fulfillment_acceptance_rate,
        bounty_fulfilled_rate=bounty_fulfilled_rate,
        avg_fulfiller_acceptance_rate=avg_fulfiller_acceptance_rate,
        avg_fulfillment_amount=avg_fulfillment_amount,
        total_fulfillment_amount=total_fulfillment_amount,
        total_unique_issuers=total_unique_issuers,
        total_unique_issuers_cum=total_unique_issuers_cum,
        total_unique_fulfillers=total_unique_fulfillers,
        total_unique_fulfillers_cum=total_unique_fulfillers_cum,
        bounty_draft=stages[DRAFT_STAGE],
        bounty_active=stages[ACTIVE_STAGE],
        bounty_completed=stages[COMPLETED_STAGE],
        bounty_expired=stages[EXPIRED_STAGE],
        bounty_dead=stages[DEAD_STAGE],
        platform=platform)

    return bounty_frame


class Command(BaseCommand):
    def handle(self, *args, **options):
        platform_query = BountyState.objects.distinct('bounty__platform')
        platforms = [p.bounty.platform for p in platform_query if p.bounty.platform] + [ALL_PLATFORM]

        for platform in platforms:
            needs_genesis = not BountiesTimeline.objects.filter(
                platform=platform, is_week=False).exists()

            first_date = BountyState.objects.first()
            last_date = datetime.utcnow()

            if needs_genesis:
                bounties_by_day = range_days(
                    first_date.change_date,
                    last_date +
                    timedelta(
                        days=1))

                for day in bounties_by_day:
                    bounty_day = generate_timeline(
                        day_bounds(day), platform=platform)

                    bounty_day.save()
            else:
                last_update = BountiesTimeline.objects.filter(
                    platform=platform, is_week=False).order_by('date').last()
                since = arrow.get(last_update.date).to('utc')
                days = range_days(since, datetime.utcnow())

                # Instead of calculate the last 5 min, we update all day until now
                # this approach provides more flexibility and simplicity in calculating more stats in the future
                # and provides a better way to expose by day or by hour in case
                # of been needed
                for day in days:
                    bounty_day = generate_timeline(
                        day_bounds(day), platform=platform)
                    bounty_points = BountiesTimeline.objects.filter(
                        date=day.date(), platform=platform, is_week=False)

                    if bounty_points.exists():
                        bounty_point = bounty_points.first()
                        bounty_day.id = bounty_point.id

                    bounty_day.save()

        for platform in platforms:
            needs_genesis = not BountiesTimeline.objects.filter(
                platform=platform, is_week=True).exists()

            first_date = BountyState.objects.first()
            last_date = datetime.utcnow()

            if needs_genesis:
                bounties_by_week = range_weeks(
                    first_date.change_date, last_date + timedelta(days=7))

                for week in bounties_by_week:
                    bounty_week = generate_timeline(
                        week_bounds(week), platform=platform)
                    bounty_week.is_week = True

                    bounty_week.save()
            else:
                last_update = BountiesTimeline.objects.filter(
                    platform=platform, is_week=True).order_by('date').last()
                since = arrow.get(last_update.date).to('utc')
                weeks = range_weeks(since, datetime.utcnow())

                for week in weeks:
                    bounds = week_bounds(week)
                    bounty_week = generate_timeline(bounds, platform=platform)
                    bounty_points = BountiesTimeline.objects.filter(
                        date=bounds[0].date(), platform=platform, is_week=True)

                    if bounty_points.exists():
                        bounty_point = bounty_points.first()
                        bounty_week.id = bounty_point.id

                    bounty_week.is_week = True
                    bounty_week.save()