Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[PRSync] Create onchain_metrics_by_artifact #23

Closed
wants to merge 2 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 16 additions & 0 deletions .github/workflows-recce/hello.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
name: Hello World Workflow

on:
pull_request:
types: [opened, synchronize]

jobs:
hello-world-job:
runs-on: ubuntu-latest

steps:
- name: Checkout repository
uses: actions/checkout@v2

- name: Print Hello, World!
run: echo "Hello, World! Test permissions."
26 changes: 26 additions & 0 deletions profiles.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
opensource_observer:
outputs:
playground:
type: bigquery
method: service-account
keyfile: "{{ env_var('DBT_GOOGLE_KEYFILE') }}"
project: "{{ env_var('DBT_GOOGLE_PROJECT') }}"
dataset: "{{ env_var('DBT_GOOGLE_DATASET') }}"
job_execution_time_seconds: 300
job_retries: 1
location: US
threads: 32
dev:
type: bigquery
method: service-account
keyfile: "{{ env_var('DBT_GOOGLE_KEYFILE') }}"
project: "{{ env_var('DBT_GOOGLE_PROJECT') }}"
dataset: "{{ env_var('DBT_GOOGLE_DEV_DATASET') }}"
job_execution_time_seconds: 300
job_retries: 1
location: US
threads: 32
# By default we target the playground. it's less costly and also safer to write
# there while developing
target: playground

Original file line number Diff line number Diff line change
@@ -0,0 +1,172 @@
{#
Summary onchain metrics for a project:
- artifact_id: The unique identifier for the artifact
- network: The network the artifact is deployed on
- artifact_name: The name of the artifact
- num_contracts: The number of contracts in the artifact
- first_txn_date: The date of the first transaction to the artifact
- total_txns: The total number of transactions to the artifact
- total_l2_gas: The total L2 gas used by the artifact
- total_users: The number of unique users interacting with the artifact
- txns_6_months: The total number of transactions to the artifact in the last 6 months
- l2_gas_6_months: The total L2 gas used by the artifact in the last 6 months
- users_6_months: The number of unique users interacting with the artifact in the last 6 months
- new_users: The number of users interacting with the artifact for the first time in the last 3 months
- active_users: The number of active users interacting with the artifact in the last 3 months
- high_frequency_users: The number of users who have made 1000+ transactions with the artifact in the last 3 months
- more_active_users: The number of users who have made 10-999 transactions with the artifact in the last 3 months
- less_active_users: The number of users who have made 1-9 transactions with the artifact in the last 3 months
- multi_project_users: The number of users who have interacted with 3+ artifacts in the last 3 months
#}
{{
config(meta = {
'sync_to_cloudsql': True
})
}}


WITH txns AS (
SELECT
a.artifact_id,
a.artifact_name,
c.to_namespace AS onchain_network,
c.from_source_id AS from_id,
c.l2_gas,
c.tx_count,
DATE(TIMESTAMP_TRUNC(c.time, MONTH)) AS bucket_month
FROM {{ ref('stg_dune__contract_invocation') }} AS c
INNER JOIN {{ ref('stg_ossd__artifacts_by_project') }} AS a
ON c.to_source_id = a.artifact_source_id
),

metrics_all_time AS (
SELECT
artifact_id,
artifact_name,
onchain_network,
COUNT(DISTINCT from_id) AS total_users,
SUM(l2_gas) AS total_l2_gas,
SUM(tx_count) AS total_txns
FROM txns
GROUP BY artifact_id, artifact_name, onchain_network
),

metrics_6_months AS (
SELECT
artifact_id,
artifact_name,
onchain_network,
COUNT(DISTINCT from_id) AS users_6_months,
SUM(l2_gas) AS l2_gas_6_months,
SUM(tx_count) AS txns_6_months
FROM txns
WHERE bucket_month >= DATE_ADD(CURRENT_DATE(), INTERVAL -6 MONTH)
GROUP BY artifact_id, artifact_name, onchain_network
),

new_users AS (
SELECT
artifact_id,
artifact_name,
onchain_network,
SUM(is_new_user) AS new_user_count
FROM (
SELECT
artifact_id,
artifact_name,
onchain_network,
from_id,
CASE
WHEN MIN(bucket_month) >= DATE_ADD(CURRENT_DATE(), INTERVAL -3 MONTH) THEN 1
END AS is_new_user
FROM txns
GROUP BY artifact_id, artifact_name, onchain_network, from_id
)
GROUP BY artifact_id, artifact_name, onchain_network
),

user_segments AS (
SELECT
artifact_id,
artifact_name,
onchain_network,
COUNT(DISTINCT CASE WHEN user_segment = 'HIGH_FREQUENCY_USER' THEN from_id END) AS high_frequency_users,
COUNT(DISTINCT CASE WHEN user_segment = 'MORE_ACTIVE_USER' THEN from_id END) AS more_active_users,
COUNT(DISTINCT CASE WHEN user_segment = 'LESS_ACTIVE_USER' THEN from_id END) AS less_active_users,
COUNT(DISTINCT CASE WHEN projects_transacted_on >= 3 THEN from_id END) AS multi_project_users
FROM (
SELECT
uta.artifact_id,
uta.artifact_name,
uta.onchain_network,
uta.from_id,
mpu.projects_transacted_on,
CASE
WHEN uta.total_tx_count >= 1000 THEN 'HIGH_FREQUENCY_USER'
WHEN uta.total_tx_count >= 10 THEN 'MORE_ACTIVE_USER'
ELSE 'LESS_ACTIVE_USER'
END AS user_segment
FROM (
SELECT
artifact_id,
artifact_name,
onchain_network,
from_id,
SUM(tx_count) AS total_tx_count
FROM txns
WHERE bucket_month >= DATE_ADD(CURRENT_DATE(), INTERVAL -3 MONTH)
GROUP BY artifact_id, artifact_name, onchain_network, from_id
) AS uta
INNER JOIN (
SELECT
onchain_network,
from_id,
COUNT(DISTINCT artifact_id) AS projects_transacted_on
FROM txns
WHERE bucket_month >= DATE_ADD(CURRENT_DATE(), INTERVAL -3 MONTH)
GROUP BY onchain_network, from_id
) AS mpu ON uta.from_id = mpu.from_id
) AS user_txns_aggregated
GROUP BY artifact_id, artifact_name, onchain_network
),

contracts AS (
SELECT
artifact_id,
artifact_namespace AS onchain_network,
COUNT(artifact_source_id) AS num_contracts
FROM {{ ref('stg_ossd__artifacts_by_project') }}
GROUP BY artifact_id, artifact_namespace
),

project_by_network AS (
SELECT
a.artifact_id,
a.artifact_namespace AS onchain_network,
a.artifact_name
FROM {{ ref('stg_ossd__artifacts_by_project') }} AS a
)

SELECT
p.artifact_id,
p.onchain_network AS network,
p.artifact_name,
c.num_contracts,
ma.total_users,
ma.total_l2_gas,
ma.total_txns,
m6.users_6_months,
m6.l2_gas_6_months,
m6.txns_6_months,
nu.new_user_count,
us.high_frequency_users,
us.more_active_users,
us.less_active_users,
us.multi_project_users,
(us.high_frequency_users + us.more_active_users + us.less_active_users) AS active_users
FROM project_by_network AS p
LEFT JOIN metrics_all_time AS ma ON p.artifact_id = ma.artifact_id AND p.onchain_network = ma.onchain_network
LEFT JOIN metrics_6_months AS m6 ON p.artifact_id = m6.artifact_id AND p.onchain_network = m6.onchain_network
LEFT JOIN new_users AS nu ON p.artifact_id = nu.artifact_id AND p.onchain_network = nu.onchain_network
LEFT JOIN user_segments AS us ON p.artifact_id = us.artifact_id AND p.onchain_network = us.onchain_network
LEFT JOIN contracts AS c ON p.artifact_id = c.artifact_id AND p.onchain_network = c.onchain_network;