0
0
mirror of https://github.com/PostHog/posthog.git synced 2024-11-28 09:16:49 +01:00
posthog/ee/clickhouse/views/test/test_clickhouse_trends.py
2023-05-25 16:31:35 +01:00

1457 lines
56 KiB
Python
Raw Blame History

This file contains invisible Unicode characters

This file contains invisible Unicode characters that are indistinguishable to humans but may be processed differently by a computer. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

import json
from dataclasses import dataclass, field
from datetime import datetime
from typing import Any, Dict, List, Optional, Union
from unittest.case import skip
from unittest.mock import ANY
import pytest
from django.core.cache import cache
from django.test import Client
from freezegun import freeze_time
from ee.api.test.base import LicensedTestMixin
from posthog.api.test.test_cohort import create_cohort_ok
from posthog.api.test.test_event_definition import create_organization, create_team, create_user
from posthog.models.group.util import create_group
from posthog.models.group_type_mapping import GroupTypeMapping
from posthog.models.instance_setting import set_instance_setting
from posthog.models.team import Team
from posthog.test.base import (
APIBaseTest,
ClickhouseTestMixin,
_create_person,
also_test_with_materialized_columns,
snapshot_clickhouse_queries,
)
from posthog.test.test_journeys import journeys_for, update_or_create_person
@pytest.mark.django_db
@pytest.mark.ee
def test_includes_only_intervals_within_range(client: Client):
"""
This is the case highlighted by https://github.com/PostHog/posthog/issues/2675
Here the issue is that we request, for instance, 14 days as the
date_from, display at weekly intervals but previously we
were displaying 4 ticks on the date axis. If we were exactly on the
beginning of the week for two weeks then we'd want 2 ticks.
Otherwise we would have 3 ticks as the range would be intersecting
with three weeks. We should never need to display 4 ticks.
"""
organization = create_organization(name="test org")
team = create_team(organization=organization)
user = create_user("user", "pass", organization)
client.force_login(user)
cache.clear()
#  I'm creating a cohort here so that I can use as a breakdown, just because
#  this is what was used demonstrated in
#  https://github.com/PostHog/posthog/issues/2675 but it might not be the
#  simplest way to reproduce
# "2021-09-19" is a sunday, i.e. beginning of week
with freeze_time("2021-09-20T16:00:00"):
#  First identify as a member of the cohort
distinct_id = "abc"
update_or_create_person(distinct_ids=[distinct_id], team_id=team.id, properties={"cohort_identifier": 1})
cohort = create_cohort_ok(
client=client,
team_id=team.id,
name="test cohort",
groups=[{"properties": [{"key": "cohort_identifier", "value": 1, "type": "person"}]}],
)
journeys_for(
events_by_person={
distinct_id: [
{"event": "$pageview", "timestamp": "2021-09-04"},
{"event": "$pageview", "timestamp": "2021-09-05"},
{"event": "$pageview", "timestamp": "2021-09-12"},
{"event": "$pageview", "timestamp": "2021-09-19"},
]
},
team=team,
)
trends = get_trends_ok(
client,
team=team,
request=TrendsRequestBreakdown(
date_from="-14days",
date_to="2021-09-21",
interval="week",
insight="TRENDS",
breakdown=json.dumps([cohort["id"]]),
breakdown_type="cohort",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
),
)
assert trends == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": ANY,
"breakdown_value": cohort["id"],
"label": "$pageview - test cohort",
"count": 3.0,
"data": [1.0, 1.0, 1.0],
# Prior to the fix this would also include '29-Aug-2021'
"labels": ["5-Sep-2021", "12-Sep-2021", "19-Sep-2021"],
"days": ["2021-09-05", "2021-09-12", "2021-09-19"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
@pytest.mark.django_db
@pytest.mark.ee
def test_can_specify_number_of_smoothing_intervals(client: Client):
"""
The Smoothing feature should allow specifying a number of intervals over
which we will provide smoothing of the aggregated trend data.
"""
organization = create_organization(name="test org")
team = create_team(organization=organization)
user = create_user("user", "pass", organization)
client.force_login(user)
with freeze_time("2021-09-20T16:00:00"):
journeys_for(
events_by_person={
"abc": [
{"event": "$pageview", "timestamp": "2021-09-01"},
{"event": "$pageview", "timestamp": "2021-09-01"},
{"event": "$pageview", "timestamp": "2021-09-02"},
{"event": "$pageview", "timestamp": "2021-09-03"},
{"event": "$pageview", "timestamp": "2021-09-03"},
{"event": "$pageview", "timestamp": "2021-09-03"},
]
},
team=team,
)
interval_3_trend = get_trends_ok(
client,
team=team,
request=TrendsRequest(
date_from="2021-09-01",
date_to="2021-09-03",
interval="day",
insight="TRENDS",
display="ActionsLineGraph",
smoothing_intervals=3,
events=[
{
"id": "$pageview",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
}
],
),
)
assert interval_3_trend == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": ANY,
"label": "$pageview",
"count": 5,
"data": [2.0, 1, 2.0],
"labels": ["1-Sep-2021", "2-Sep-2021", "3-Sep-2021"],
"days": ["2021-09-01", "2021-09-02", "2021-09-03"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
interval_2_trend = get_trends_ok(
client,
team=team,
request=TrendsRequest(
date_from="2021-09-01",
date_to="2021-09-03",
interval="day",
insight="TRENDS",
display="ActionsLineGraph",
smoothing_intervals=2,
events=[
{
"id": "$pageview",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
}
],
),
)
assert interval_2_trend == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": ANY,
"label": "$pageview",
"count": 5,
"data": [2.0, 1, 2.0],
"labels": ["1-Sep-2021", "2-Sep-2021", "3-Sep-2021"],
"days": ["2021-09-01", "2021-09-02", "2021-09-03"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
interval_1_trend = get_trends_ok(
client,
team=team,
request=TrendsRequest(
date_from="2021-09-01",
date_to="2021-09-03",
interval="day",
insight="TRENDS",
display="ActionsLineGraph",
smoothing_intervals=1,
events=[
{
"id": "$pageview",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
}
],
),
)
assert interval_1_trend == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": {
"id": "$pageview",
"type": "events",
"order": 0,
"name": "$pageview",
"custom_name": None,
"math": None,
"math_hogql": None,
"math_property": None,
"math_group_type_index": ANY,
"properties": {},
},
"label": "$pageview",
"count": 6.0,
"data": [2.0, 1.0, 3.0],
"labels": ["1-Sep-2021", "2-Sep-2021", "3-Sep-2021"],
"days": ["2021-09-01", "2021-09-02", "2021-09-03"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
@pytest.mark.django_db
@pytest.mark.ee
def test_smoothing_intervals_copes_with_null_values(client: Client):
"""
The Smoothing feature should allow specifying a number of intervals over
which we will provide smoothing of the aggregated trend data.
"""
organization = create_organization(name="test org")
team = create_team(organization=organization)
user = create_user("user", "pass", organization)
client.force_login(user)
cache.clear()
with freeze_time("2021-09-20T16:00:00"):
journeys_for(
events_by_person={
"abc": [
{"event": "$pageview", "timestamp": "2021-09-01"},
{"event": "$pageview", "timestamp": "2021-09-01"},
{"event": "$pageview", "timestamp": "2021-09-01"},
# No events on 2 Sept
{"event": "$pageview", "timestamp": "2021-09-03"},
{"event": "$pageview", "timestamp": "2021-09-03"},
{"event": "$pageview", "timestamp": "2021-09-03"},
]
},
team=team,
)
interval_3_trend = get_trends_ok(
client,
team=team,
request=TrendsRequest(
date_from="2021-09-01",
date_to="2021-09-03",
interval="day",
insight="TRENDS",
display="ActionsLineGraph",
smoothing_intervals=3,
events=[
{
"id": "$pageview",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
}
],
),
)
assert interval_3_trend == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": ANY,
"label": "$pageview",
"count": 6.0,
"data": [3.0, 1.0, 2.0],
"labels": ["1-Sep-2021", "2-Sep-2021", "3-Sep-2021"],
"days": ["2021-09-01", "2021-09-02", "2021-09-03"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
interval_1_trend = get_trends_ok(
client,
team=team,
request=TrendsRequest(
date_from="2021-09-01",
date_to="2021-09-03",
interval="day",
insight="TRENDS",
display="ActionsLineGraph",
smoothing_intervals=1,
events=[
{
"id": "$pageview",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
}
],
),
)
assert interval_1_trend == {
"is_cached": False,
"last_refresh": "2021-09-20T16:00:00Z",
"next": None,
"timezone": "UTC",
"result": [
{
"action": ANY,
"label": "$pageview",
"count": 6.0,
"data": [3.0, 0.0, 3.0],
"labels": ["1-Sep-2021", "2-Sep-2021", "3-Sep-2021"],
"days": ["2021-09-01", "2021-09-02", "2021-09-03"],
"persons_urls": ANY,
"filter": ANY,
}
],
}
@dataclass
class TrendsRequest:
date_from: Optional[str] = None
date_to: Optional[str] = None
interval: Optional[str] = None
insight: Optional[str] = None
display: Optional[str] = None
compare: Optional[bool] = None
events: List[Dict[str, Any]] = field(default_factory=list)
properties: List[Dict[str, Any]] = field(default_factory=list)
smoothing_intervals: Optional[int] = 1
refresh: Optional[bool] = False
@dataclass
class TrendsRequestBreakdown(TrendsRequest):
breakdown: Optional[Union[List[int], str]] = None
breakdown_type: Optional[str] = None
def get_trends(client, request: Union[TrendsRequestBreakdown, TrendsRequest], team: Team):
data: Dict[str, Any] = {
"date_from": request.date_from,
"date_to": request.date_to,
"interval": request.interval,
"insight": request.insight,
"display": request.display,
"compare": request.compare,
"events": json.dumps(request.events),
"properties": json.dumps(request.properties),
"smoothing_intervals": request.smoothing_intervals,
"refresh": request.refresh,
}
if isinstance(request, TrendsRequestBreakdown):
data["breakdown"] = request.breakdown
data["breakdown_type"] = request.breakdown_type
filtered_data = {k: v for k, v in data.items() if v is not None}
return client.get(f"/api/projects/{team.id}/insights/trend/", data=filtered_data)
def get_trends_ok(client: Client, request: TrendsRequest, team: Team):
response = get_trends(client=client, request=request, team=team)
assert response.status_code == 200, response.content
return response.json()
@dataclass
class NormalizedTrendResult:
value: float
label: str
person_url: str
breakdown_value: Optional[Union[str, int]]
def get_trends_time_series_ok(
client: Client, request: TrendsRequest, team: Team, with_order: bool = False
) -> Dict[str, Dict[str, NormalizedTrendResult]]:
data = get_trends_ok(client=client, request=request, team=team)
res = {}
for item in data["result"]:
collect_dates = {}
for idx, date in enumerate(item["days"]):
collect_dates[date] = NormalizedTrendResult(
value=item["data"][idx],
label=item["labels"][idx],
person_url=item["persons_urls"][idx]["url"],
breakdown_value=item.get("breakdown_value", None),
)
suffix = " - {}".format(item["compare_label"]) if item.get("compare_label") else ""
if with_order:
suffix += " - {}".format(item["action"]["order"]) if item["action"].get("order") is not None else ""
res["{}{}".format(item["label"], suffix)] = collect_dates
return res
def get_trends_aggregate_ok(client: Client, request: TrendsRequest, team: Team) -> Dict[str, NormalizedTrendResult]:
data = get_trends_ok(client=client, request=request, team=team)
res = {}
for item in data["result"]:
res[item["label"]] = NormalizedTrendResult(
value=item["aggregated_value"],
label=item["action"]["name"],
person_url=item["persons"]["url"],
breakdown_value=item.get("breakdown_value", None),
)
return res
def get_trends_people_ok(client: Client, url: str):
response = client.get("/" + url)
assert response.status_code == 200, response.content
return response.json()["results"][0]["people"]
def get_people_from_url_ok(client: Client, url: str):
response = client.get("/" + url)
assert response.status_code == 200, response.content
return response.json()["results"][0]["people"]
class ClickhouseTestTrends(ClickhouseTestMixin, LicensedTestMixin, APIBaseTest):
maxDiff = None
CLASS_DATA_LEVEL_SETUP = False
@snapshot_clickhouse_queries
def test_insight_trends_basic(self):
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
}
created_people = journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 0
assert data["$pageview"]["2012-01-14"].value == 2
assert data["$pageview"]["2012-01-14"].label == "14-Jan-2012"
assert data["$pageview"]["2012-01-15"].value == 0
with freeze_time("2012-01-15T04:01:34.000Z"):
people = get_people_from_url_ok(self.client, data["$pageview"]["2012-01-14"].person_url)
assert sorted([p["id"] for p in people]) == sorted(
[str(created_people["1"].uuid), str(created_people["2"].uuid)]
)
def test_insight_trends_entity_overlap(self):
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "val"}}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
"3": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
}
created_people = journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
},
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 1,
"properties": [{"key": "key", "value": "val"}],
"math_property": None,
},
],
)
data = get_trends_time_series_ok(self.client, request, self.team, with_order=True)
assert data["$pageview - 0"]["2012-01-13"].value == 0
assert data["$pageview - 0"]["2012-01-14"].value == 3
assert data["$pageview - 1"]["2012-01-14"].value == 1
assert data["$pageview - 0"]["2012-01-14"].label == "14-Jan-2012"
assert data["$pageview - 0"]["2012-01-15"].value == 0
with freeze_time("2012-01-15T04:01:34.000Z"):
people = get_people_from_url_ok(self.client, data["$pageview - 1"]["2012-01-14"].person_url)
assert sorted([p["id"] for p in people]) == sorted([str(created_people["1"].uuid)])
with freeze_time("2012-01-15T04:01:34.000Z"):
people = get_people_from_url_ok(self.client, data["$pageview - 0"]["2012-01-14"].person_url)
assert sorted([p["id"] for p in people]) == sorted(
[str(created_people["1"].uuid), str(created_people["2"].uuid), str(created_people["3"].uuid)]
)
@snapshot_clickhouse_queries
def test_insight_trends_clean_arg(self):
events_by_actor = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "val"}}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
}
created_actors = journeys_for(events_by_actor, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": None, # this argument will now be removed from the request instead of becoming a string
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [{"key": "key", "value": "val"}],
"math_property": None,
}
],
)
data = get_trends_time_series_ok(self.client, request, self.team)
actors = get_people_from_url_ok(self.client, data["$pageview"]["2012-01-14"].person_url)
# this would return 2 people prior to #8103 fix
# 'None' values have to be purged before formatting into the actor url
assert sorted([p["id"] for p in actors]) == sorted([str(created_actors["1"].uuid)])
@snapshot_clickhouse_queries
def test_insight_trends_aggregate(self):
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3)}],
}
created_people = journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsPie",
events=[
{
"id": "$pageview",
"math": None,
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data = get_trends_aggregate_ok(self.client, request, self.team)
assert data["$pageview"].value == 2
assert data["$pageview"].label == "$pageview"
with freeze_time("2012-01-15T04:01:34.000Z"):
people = get_people_from_url_ok(self.client, data["$pageview"].person_url)
assert sorted([p["id"] for p in people]) == sorted(
[str(created_people["1"].uuid), str(created_people["2"].uuid)]
)
@snapshot_clickhouse_queries
def test_insight_trends_cumulative(self):
_create_person(team_id=self.team.pk, distinct_ids=["p1"], properties={"key": "some_val"})
_create_person(team_id=self.team.pk, distinct_ids=["p2"], properties={"key": "some_val"})
_create_person(team_id=self.team.pk, distinct_ids=["p3"], properties={"key": "some_val"})
events_by_person = {
"p1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "val"}},
{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "val"}},
],
"p2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "notval"}}],
"p3": [{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "val"}}],
}
created_people = journeys_for(events_by_person, self.team)
# Total Volume
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraphCumulative",
events=[
{
"id": "$pageview",
"math": None,
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
person_response = get_people_from_url_ok(self.client, data_response["$pageview"]["2012-01-14"].person_url)
assert data_response["$pageview"]["2012-01-13"].value == 2
assert data_response["$pageview"]["2012-01-14"].value == 4
assert data_response["$pageview"]["2012-01-15"].value == 4
assert data_response["$pageview"]["2012-01-14"].label == "14-Jan-2012"
assert sorted([p["id"] for p in person_response]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p2"].uuid), str(created_people["p3"].uuid)]
)
# DAU
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraphCumulative",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
person_response = get_people_from_url_ok(self.client, data_response["$pageview"]["2012-01-14"].person_url)
assert data_response["$pageview"]["2012-01-13"].value == 2
assert data_response["$pageview"]["2012-01-14"].value == 3
assert data_response["$pageview"]["2012-01-15"].value == 3
assert data_response["$pageview"]["2012-01-14"].label == "14-Jan-2012"
assert sorted([p["id"] for p in person_response]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p2"].uuid), str(created_people["p3"].uuid)]
)
# breakdown
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraphCumulative",
breakdown="key",
breakdown_type="event",
events=[
{
"id": "$pageview",
"math": None,
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
person_response = get_people_from_url_ok(
self.client, data_response["$pageview - val"]["2012-01-14"].person_url
)
assert data_response["$pageview - val"]["2012-01-13"].value == 1
assert data_response["$pageview - val"]["2012-01-13"].breakdown_value == "val"
assert data_response["$pageview - val"]["2012-01-14"].value == 3
assert data_response["$pageview - val"]["2012-01-14"].label == "14-Jan-2012"
assert sorted([p["id"] for p in person_response]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p3"].uuid)]
)
# breakdown wau
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraphCumulative",
breakdown="key",
breakdown_type="event",
events=[
{
"id": "$pageview",
"math": "weekly_active",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [{"type": "person", "key": "key", "value": "some_val"}],
"math_property": None,
}
],
properties=[{"type": "person", "key": "key", "value": "some_val"}],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
people = get_people_from_url_ok(self.client, data_response["$pageview - val"]["2012-01-14"].person_url)
assert data_response["$pageview - val"]["2012-01-13"].value == 1
assert data_response["$pageview - val"]["2012-01-13"].breakdown_value == "val"
assert data_response["$pageview - val"]["2012-01-14"].value == 3
assert data_response["$pageview - val"]["2012-01-14"].label == "14-Jan-2012"
assert sorted([p["id"] for p in people]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p3"].uuid)]
)
# breakdown dau
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraphCumulative",
breakdown="key",
breakdown_type="event",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
people = get_people_from_url_ok(self.client, data_response["$pageview - val"]["2012-01-14"].person_url)
assert data_response["$pageview - val"]["2012-01-13"].value == 1
assert data_response["$pageview - val"]["2012-01-13"].breakdown_value == "val"
assert data_response["$pageview - val"]["2012-01-14"].value == 2
assert data_response["$pageview - val"]["2012-01-14"].label == "14-Jan-2012"
assert sorted([p["id"] for p in people]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p3"].uuid)]
)
@also_test_with_materialized_columns(["key"])
def test_breakdown_with_filter(self):
events_by_person = {
"person1": [{"event": "sign up", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "val"}}],
"person2": [{"event": "sign up", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "oh"}}],
}
created_people = journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
params = TrendsRequestBreakdown(
date_from="-14d",
breakdown="key",
events=[{"id": "sign up", "name": "sign up", "type": "events", "order": 0}],
properties=[{"key": "key", "value": "oh", "operator": "not_icontains"}],
)
data_response = get_trends_time_series_ok(self.client, params, self.team)
person_response = get_people_from_url_ok(
self.client, data_response["sign up - val"]["2012-01-13"].person_url
)
assert data_response["sign up - val"]["2012-01-13"].value == 1
assert data_response["sign up - val"]["2012-01-13"].breakdown_value == "val"
assert sorted([p["id"] for p in person_response]) == sorted([str(created_people["person1"].uuid)])
with freeze_time("2012-01-15T04:01:34.000Z"):
params = TrendsRequestBreakdown(
date_from="-14d",
breakdown="key",
display="ActionsPie",
events=[{"id": "sign up", "name": "sign up", "type": "events", "order": 0}],
)
aggregate_response = get_trends_aggregate_ok(self.client, params, self.team)
aggregate_person_response = get_people_from_url_ok(
self.client, aggregate_response["sign up - val"].person_url
)
assert aggregate_response["sign up - val"].value == 1
assert sorted([p["id"] for p in aggregate_person_response]) == sorted([str(created_people["person1"].uuid)])
def test_insight_trends_compare(self):
events_by_person = {
"p1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 5, 3), "properties": {"key": "val"}},
{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "val"}},
],
"p2": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 5, 3), "properties": {"key": "notval"}},
{"event": "$pageview", "timestamp": datetime(2012, 1, 14, 3), "properties": {"key": "notval"}},
],
}
created_people = journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-7d",
compare=True,
events=[{"id": "$pageview", "name": "$pageview", "type": "events", "order": 0}],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
assert data_response["$pageview - current"]["2012-01-13"].value == 0
assert data_response["$pageview - current"]["2012-01-14"].value == 2
assert data_response["$pageview - previous"]["2012-01-04"].value == 0
assert data_response["$pageview - previous"]["2012-01-05"].value == 2
with freeze_time("2012-01-15T04:01:34.000Z"):
curr_people = get_people_from_url_ok(
self.client, data_response["$pageview - current"]["2012-01-14"].person_url
)
prev_people = get_people_from_url_ok(
self.client, data_response["$pageview - previous"]["2012-01-05"].person_url
)
assert sorted([p["id"] for p in curr_people]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p2"].uuid)]
)
assert sorted([p["id"] for p in prev_people]) == sorted(
[str(created_people["p1"].uuid), str(created_people["p2"].uuid)]
)
class ClickhouseTestTrendsGroups(ClickhouseTestMixin, LicensedTestMixin, APIBaseTest):
maxDiff = None
CLASS_DATA_LEVEL_SETUP = False
def _create_groups(self):
GroupTypeMapping.objects.create(team=self.team, group_type="organization", group_type_index=0)
GroupTypeMapping.objects.create(team=self.team, group_type="company", group_type_index=1)
create_group(team_id=self.team.pk, group_type_index=0, group_key="org:5", properties={"industry": "finance"})
create_group(team_id=self.team.pk, group_type_index=0, group_key="org:6", properties={"industry": "technology"})
create_group(team_id=self.team.pk, group_type_index=0, group_key="org:7", properties={"industry": "finance"})
create_group(
team_id=self.team.pk, group_type_index=1, group_key="company:10", properties={"industry": "finance"}
)
@snapshot_clickhouse_queries
def test_aggregating_by_group(self):
self._create_groups()
events_by_person = {
"person1": [
{"event": "$pageview", "timestamp": datetime(2020, 1, 2, 12), "properties": {"$group_0": "org:5"}},
{"event": "$pageview", "timestamp": datetime(2020, 1, 2, 12), "properties": {"$group_0": "org:6"}},
{
"event": "$pageview",
"timestamp": datetime(2020, 1, 2, 12),
"properties": {"$group_0": "org:6", "$group_1": "company:10"},
},
]
}
journeys_for(events_by_person, self.team)
request = TrendsRequest(
date_from="2020-01-01 00:00:00",
date_to="2020-01-12 00:00:00",
events=[
{"id": "$pageview", "type": "events", "order": 0, "math": "unique_group", "math_group_type_index": 0}
],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
assert data_response["$pageview"]["2020-01-01"].value == 0
assert data_response["$pageview"]["2020-01-02"].value == 2
curr_people = get_people_from_url_ok(self.client, data_response["$pageview"]["2020-01-02"].person_url)
assert sorted([p["group_key"] for p in curr_people]) == sorted(["org:5", "org:6"])
@snapshot_clickhouse_queries
def test_aggregating_by_session(self):
events_by_person = {
"person1": [
{"event": "$pageview", "timestamp": datetime(2020, 1, 1, 12), "properties": {"$session_id": "1"}},
{"event": "$pageview", "timestamp": datetime(2020, 1, 1, 12), "properties": {"$session_id": "1"}},
{"event": "$pageview", "timestamp": datetime(2020, 1, 2, 12), "properties": {"$session_id": "2"}},
],
"person2": [
{"event": "$pageview", "timestamp": datetime(2020, 1, 2, 12), "properties": {"$session_id": "3"}}
],
}
journeys_for(events_by_person, self.team)
request = TrendsRequest(
date_from="2020-01-01 00:00:00",
date_to="2020-01-12 00:00:00",
events=[{"id": "$pageview", "type": "events", "order": 0, "math": "unique_session"}],
)
data_response = get_trends_time_series_ok(self.client, request, self.team)
assert data_response["$pageview"]["2020-01-01"].value == 1
assert data_response["$pageview"]["2020-01-02"].value == 2
curr_people = get_people_from_url_ok(self.client, data_response["$pageview"]["2020-01-02"].person_url)
assert sorted([p["distinct_ids"][0] for p in curr_people]) == sorted(["person1", "person2"])
class ClickhouseTestTrendsCaching(ClickhouseTestMixin, LicensedTestMixin, APIBaseTest):
maxDiff = None
CLASS_DATA_LEVEL_SETUP = False
@snapshot_clickhouse_queries
def test_insight_trends_merging(self):
set_instance_setting("STRICT_CACHING_TEAMS", "all")
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)}],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
assert data["$pageview"]["2012-01-15"].value == 0
events_by_person = {"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 15, 3)}]}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
refresh=True,
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
assert data["$pageview"]["2012-01-15"].value == 1
def test_insight_trends_merging_multiple(self):
set_instance_setting("STRICT_CACHING_TEAMS", "all")
events_by_person = {
"1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3)},
],
"2": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3)},
],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
},
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 1,
"properties": [],
"math_property": None,
},
],
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
assert data["$pageview"]["2012-01-15"].value == 0
assert data["$action"]["2012-01-13"].value == 2
assert data["$action"]["2012-01-14"].value == 0
assert data["$action"]["2012-01-15"].value == 0
events_by_person = {
"1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 15, 3)},
{"event": "$action", "timestamp": datetime(2012, 1, 15, 3)},
],
"3": [ # thhis won't be counted
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3)},
],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
},
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 1,
"properties": [],
"math_property": None,
},
],
refresh=True,
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
assert data["$pageview"]["2012-01-15"].value == 1
assert data["$action"]["2012-01-13"].value == 2
assert data["$action"]["2012-01-14"].value == 0
assert data["$action"]["2012-01-15"].value == 1
@skip("Don't handle breakdowns right now")
def test_insight_trends_merging_breakdown(self):
set_instance_setting("STRICT_CACHING_TEAMS", "all")
events_by_person = {
"1": [
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "2"}},
],
"2": [{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}}],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
breakdown="key",
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$action - 1"]["2012-01-13"].value == 2
assert data["$action - 1"]["2012-01-14"].value == 0
assert data["$action - 1"]["2012-01-15"].value == 0
assert data["$action - 2"]["2012-01-13"].value == 1
assert data["$action - 2"]["2012-01-14"].value == 0
assert data["$action - 2"]["2012-01-15"].value == 0
events_by_person = {
"1": [{"event": "$action", "timestamp": datetime(2012, 1, 15, 3), "properties": {"key": "2"}}],
"2": [
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "2"}}
], # this won't be counted
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
breakdown="key",
refresh=True,
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$action - 1"]["2012-01-13"].value == 2
assert data["$action - 1"]["2012-01-14"].value == 0
assert data["$action - 1"]["2012-01-15"].value == 0
assert data["$action - 2"]["2012-01-13"].value == 1
assert data["$action - 2"]["2012-01-14"].value == 0
assert data["$action - 2"]["2012-01-15"].value == 1
@skip("Don't handle breakdowns right now")
def test_insight_trends_merging_breakdown_multiple(self):
set_instance_setting("STRICT_CACHING_TEAMS", "all")
events_by_person = {
"1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "2"}},
],
"2": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}},
{"event": "$action", "timestamp": datetime(2012, 1, 13, 3), "properties": {"key": "1"}},
],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
},
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 1,
"properties": [],
"math_property": None,
},
],
breakdown="key",
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview - 1"]["2012-01-13"].value == 2
assert data["$pageview - 1"]["2012-01-14"].value == 0
assert data["$pageview - 1"]["2012-01-15"].value == 0
assert data["$action - 1"]["2012-01-13"].value == 2
assert data["$action - 1"]["2012-01-14"].value == 0
assert data["$action - 1"]["2012-01-15"].value == 0
assert data["$action - 2"]["2012-01-13"].value == 1
assert data["$action - 2"]["2012-01-14"].value == 0
assert data["$action - 2"]["2012-01-15"].value == 0
events_by_person = {
"1": [
{"event": "$pageview", "timestamp": datetime(2012, 1, 15, 3), "properties": {"key": "1"}},
{"event": "$action", "timestamp": datetime(2012, 1, 15, 3), "properties": {"key": "2"}},
],
"2": [
{
"event": "$action",
"timestamp": datetime(2012, 1, 13, 3),
"properties": {"key": "2"},
} # this won't be counted
],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-15T04:01:34.000Z"):
request = TrendsRequestBreakdown(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
},
{
"id": "$action",
"math": "dau",
"name": "$action",
"custom_name": None,
"type": "events",
"order": 1,
"properties": [],
"math_property": None,
},
],
breakdown="key",
refresh=True,
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview - 1"]["2012-01-13"].value == 2
assert data["$pageview - 1"]["2012-01-14"].value == 0
assert data["$pageview - 1"]["2012-01-15"].value == 1
assert data["$action - 1"]["2012-01-13"].value == 2
assert data["$action - 1"]["2012-01-14"].value == 0
assert data["$action - 1"]["2012-01-15"].value == 0
assert data["$action - 2"]["2012-01-13"].value == 1
assert data["$action - 2"]["2012-01-14"].value == 0
assert data["$action - 2"]["2012-01-15"].value == 1
# When the latest time interval in the cached result doesn't match the current interval, do not use caching pattern
@snapshot_clickhouse_queries
def test_insight_trends_merging_skipped_interval(self):
set_instance_setting("STRICT_CACHING_TEAMS", "all")
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 13, 3)}],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-14T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
events_by_person = {
"1": [{"event": "$pageview", "timestamp": datetime(2012, 1, 15, 3)}],
"2": [{"event": "$pageview", "timestamp": datetime(2012, 1, 16, 3)}],
}
journeys_for(events_by_person, self.team)
with freeze_time("2012-01-16T04:01:34.000Z"):
request = TrendsRequest(
date_from="-14d",
display="ActionsLineGraph",
events=[
{
"id": "$pageview",
"math": "dau",
"name": "$pageview",
"custom_name": None,
"type": "events",
"order": 0,
"properties": [],
"math_property": None,
}
],
refresh=True,
)
data = get_trends_time_series_ok(self.client, request, self.team)
assert data["$pageview"]["2012-01-13"].value == 2
assert data["$pageview"]["2012-01-14"].value == 0
assert data["$pageview"]["2012-01-15"].value == 1
assert data["$pageview"]["2012-01-16"].value == 1