Skip to content

Instantly share code, notes, and snippets.

@zdenekzed
Forked from ToddKerpelman/0_BigQuery_Recipes.md
Created August 27, 2019 17:04
Show Gist options
  • Save zdenekzed/0f10c103ffe28ff8e81d20a536f2f8ac to your computer and use it in GitHub Desktop.
Save zdenekzed/0f10c103ffe28ff8e81d20a536f2f8ac to your computer and use it in GitHub Desktop.

Revisions

  1. Todd Kerpelman revised this gist Jul 20, 2018. 1 changed file with 1 addition and 2 deletions.
    3 changes: 1 addition & 2 deletions 0_BigQuery_Recipes.md
    Original file line number Diff line number Diff line change
    @@ -1,8 +1,7 @@
    A handful of BigQuery SQL queries that you can use to analyze your own Google Analytics for Firebase data.
    To find out more about how they work, check out our presentation from Cloud Next 2018 (Video link to be added soon)

    Please note that these scripts have been updated to make sure of the [new Firebase schema,]
    (https://support.google.com/firebase/answer/7029846) which was rolled out to Analytics products in July of 2018.
    Please note that these scripts have been updated to make sure of the [new Firebase schema,](https://support.google.com/firebase/answer/7029846) which was rolled out to Analytics products in July of 2018.

    Note that none of these scripts will work out of the box -- you'll need to update the values in brackets
    with the names of your actual datasets, and you'll most likely also need to replace the names of events
  2. Todd Kerpelman revised this gist Jul 20, 2018. 7 changed files with 50 additions and 53 deletions.
    3 changes: 2 additions & 1 deletion 0_BigQuery_Recipes.md
    Original file line number Diff line number Diff line change
    @@ -1,7 +1,8 @@
    A handful of BigQuery SQL queries that you can use to analyze your own Google Analytics for Firebase data.
    To find out more about how they work, check out our presentation from Cloud Next 2018 (Video link to be added soon)

    Please note that these scripts have been updated to make sure of the [new Firebase schema],(https://support.google.com/firebase/answer/7029846) which was rolled out to Analytics products in July of 2018.
    Please note that these scripts have been updated to make sure of the [new Firebase schema,]
    (https://support.google.com/firebase/answer/7029846) which was rolled out to Analytics products in July of 2018.

    Note that none of these scripts will work out of the box -- you'll need to update the values in brackets
    with the names of your actual datasets, and you'll most likely also need to replace the names of events
    2 changes: 1 addition & 1 deletion 3_filter_one_event_parameter_by_another.sql
    Original file line number Diff line number Diff line change
    @@ -13,7 +13,7 @@ FROM (
    (SELECT value.int_value FROM UNNEST(event_params) WHERE key = "score") AS score,
    (SELECT value.string_value FROM UNNEST(event_params) WHERE key = "type_of_game") AS type_of_game
    FROM
    `<dataset>.events_<date>`,
    `<dataset>.events_<date>`
    WHERE
    event_name = "round_completed" )
    GROUP BY
    15 changes: 7 additions & 8 deletions 4_filter_by_range_of_userprop_values.sql
    Original file line number Diff line number Diff line change
    @@ -8,18 +8,17 @@ SELECT
    AVG(score)
    FROM (
    SELECT
    event.name,
    event_name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    CAST(user_prop.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    `<dataset>.events_<date>`,
    UNNEST(event_params) AS param,
    UNNEST(user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    event_name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    WHERE
    xp > 15000
    OR xp < 25000
    AND xp < 25000
    16 changes: 8 additions & 8 deletions 5_filter_by_two_user_properties_at_once.sql
    Original file line number Diff line number Diff line change
    @@ -4,6 +4,7 @@
    # (in this case, is_spender and how many power-ups they have). This is how you'd do it. Note that the case statement
    # at the top isn't really necessary if you have a user property that doesn't have too many values.


    SELECT
    AVG(score) AS avg_score,
    spender,
    @@ -13,18 +14,17 @@ SELECT
    END AS powers_txt
    FROM (
    SELECT
    event.name,
    (SELECT value.int_value FROM UNNEST(event.params) WHERE key = "score") AS score,
    (SELECT value.value.string_value FROM UNNEST(user_dim.user_properties) WHERE key = "is_spender") AS spender,
    (SELECT CAST(value.value.string_value AS int64) FROM UNNEST(user_dim.user_properties) WHERE key = "powers") AS powers
    event_name,
    (SELECT value.int_value FROM UNNEST(event_params) WHERE key = "score") AS score,
    (SELECT value.string_value FROM UNNEST(user_properties) WHERE key = "is_spender") AS spender,
    (SELECT CAST(value.string_value AS int64) FROM UNNEST(user_properties) WHERE key = "powers") AS powers
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
    `<dataset>.events_<date>`
    WHERE
    event.name = "round_completed" )
    event_name = "round_completed" )
    GROUP BY
    spender,
    powers_txt
    ORDER BY
    spender,
    powers_txt
    powers_txt
    16 changes: 7 additions & 9 deletions 6_spend_currency.sql
    Original file line number Diff line number Diff line change
    @@ -4,24 +4,22 @@
    # Make sure you replace "spend_virtual_currency" down near the bottom there with the actual
    # event you're trying to target

    #standardSQL
    SELECT
    s0,
    s1,
    s2,
    COUNT(*) AS count
    FROM (
    SELECT
    user_dim.app_info.app_instance_id AS app_instance,
    event.timestamp_micros AS event_timestamp,
    event.name AS s0,
    LEAD (event.name, 1) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS s1,
    LEAD (event.name, 2) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS s2
    user_pseudo_id,
    event_timestamp,
    event_name AS s0,
    LEAD (event_name, 1) OVER (PARTITION BY user_pseudo_id ORDER BY event_timestamp) AS s1,
    LEAD (event_name, 2) OVER (PARTITION BY user_pseudo_id ORDER BY event_timestamp) AS s2
    FROM
    `<my_dataset_.app_events_<date>`,
    UNNEST(event_dim) AS event
    `<dataset>.events_<date>`
    ORDER BY
    app_instance,
    user_pseudo_id,
    event_timestamp )
    WHERE
    s2 = "spend_virtual_currency"
    17 changes: 8 additions & 9 deletions 7_common_screen_patterns.sql
    Original file line number Diff line number Diff line change
    @@ -10,20 +10,19 @@ SELECT
    COUNT(*) AS count
    FROM (
    SELECT
    user_dim.app_info.app_instance_id AS app_instance,
    event.timestamp_micros AS event_timestamp,
    user_pseudo_id,
    event_timestamp,
    param.value.string_value AS screen_0,
    LEAD (param.value.string_value, 1) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS screen_1,
    LEAD (param.value.string_value, 2) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS screen_2
    LEAD (param.value.string_value, 1) OVER (PARTITION BY user_pseudo_id ORDER BY event_timestamp ) AS screen_1,
    LEAD (param.value.string_value, 2) OVER (PARTITION BY user_pseudo_id ORDER BY event_timestamp ) AS screen_2
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    `<dataset>.events_<date>`,
    UNNEST(event_params) AS param
    WHERE
    event.name = "screen_view"
    event_name = "screen_view"
    AND param.key = "firebase_screen_class"
    ORDER BY
    app_instance,
    user_pseudo_id,
    event_timestamp )
    WHERE
    screen_1 IS NOT NULL
    34 changes: 17 additions & 17 deletions 8_closed_funnel_with_time_constraints.sql
    Original file line number Diff line number Diff line change
    @@ -2,34 +2,34 @@

    # A closed funnel with time constraints!
    # Count the number of occurrences a user encountered a "start_event" event, and then the number of times
    # they encountered an "end_event" event after pre
    # they encountered an "end_event" event after encountering the start event within a certain time window (4
    # hours, in this example.)

    SELECT
    COUNTIF(funnel_start_time IS NOT NULL) AS funnel_begin_count,
    COUNTIF(funnel_end_time - funnel_start_time < 4 * 60 * 60 * 1000 * 1000) AS funnel_end_count
    FROM (
    SELECT
    funnel_start_time,
    LEAD(funnel_end_time, 1) OVER (PARTITION BY app_instance_id ORDER BY event_time) AS funnel_end_time
    LEAD(funnel_end_time, 1) OVER (PARTITION BY user_pseudo_id ORDER BY event_timestamp) AS funnel_end_time
    FROM (
    SELECT
    event.name,
    IF (event.name = "start_event",
    event.timestamp_micros,
    event_name,
    IF (event_name = "start_event",
    event_timestamp,
    NULL) AS funnel_start_time,
    IF (event.name = "end_event",
    event.timestamp_micros,
    IF (event_name = "end_event",
    event_timestamp,
    NULL) AS funnel_end_time,
    user_dim.app_info.app_instance_id,
    event.timestamp_micros AS event_time
    user_pseudo_id,
    event_timestamp
    FROM
    `<dataset>.app_events_*`,
    UNNEST(event_dim) AS event
    # `<dataset>.events_<date>`
    WHERE
    event.name = "start_event"
    OR event.name = "end_event"
    AND _TABLE_SUFFIX BETWEEN '<date1>'
    AND '<date2>'
    event_name = "start_event"
    OR event_name = "end_event"
    AND _TABLE_SUFFIX BETWEEN '<yyyymmdd>'
    AND '<yyyymmdd>'
    ORDER BY
    app_instance_id,
    event.timestamp_micros ) )
    user_pseudo_id,
    event_timestamp) )
  3. Todd Kerpelman revised this gist Jul 20, 2018. 4 changed files with 24 additions and 23 deletions.
    8 changes: 5 additions & 3 deletions 0_BigQuery_Recipes.md
    Original file line number Diff line number Diff line change
    @@ -1,9 +1,11 @@
    A handful of BigQuery SQL queries that you can use to analyze your own Google Analytics for Firebase data.
    To find out more about how they work, check out my presentation from the Firebase Developer Conference in
    Amsterdam (video to be added soon).
    To find out more about how they work, check out our presentation from Cloud Next 2018 (Video link to be added soon)

    Please note that these scripts have been updated to make sure of the [new Firebase schema],(https://support.google.com/firebase/answer/7029846) which was rolled out to Analytics products in July of 2018.

    Note that none of these scripts will work out of the box -- you'll need to update the values in brackets
    with the names of your actual datasets, and you'll most likely also need to replace the names of events
    and event properties with ones that are appropriate for your app.

    The contents of this gist are licensed under the [Apache License, version 2.0](https://www.apache.org/licenses/LICENSE-2.0)
    The contents of this gist are licensed under the [Apache License, version 2.0](https://www.apache.org/licenses/LICENSE-2.0)

    9 changes: 4 additions & 5 deletions 1_analyze_event_param.sql
    Original file line number Diff line number Diff line change
    @@ -8,9 +8,8 @@ SELECT
    AVG(param.value.int_value) AS avg_score,
    stddev(param.value.int_value) AS stddev
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    `<dataset>.events_<date>`,
    UNNEST(event_params) AS param
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    event_name = "round_completed"
    AND param.key = "score"
    16 changes: 8 additions & 8 deletions 2_coorelate_event_param_and_userprop.sql
    Original file line number Diff line number Diff line change
    @@ -5,18 +5,18 @@
    # from a string to an int).

    SELECT
    corr(score, xp)
    corr(score,
    xp)
    FROM (
    SELECT
    event.name,
    event_name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    CAST(user_prop.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    `<dataset>.events_<date>`,
    UNNEST(event_params) AS param,
    UNNEST(user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    event_name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    14 changes: 7 additions & 7 deletions 3_filter_one_event_parameter_by_another.sql
    Original file line number Diff line number Diff line change
    @@ -9,13 +9,13 @@ SELECT
    MAX(type_of_game)
    FROM (
    SELECT
    event.name,
    (SELECT value.int_value FROM UNNEST(event.params) WHERE key = "score") AS score,
    (SELECT value.string_value FROM UNNEST(event.params) WHERE key = "type_of_game") AS type_of_game
    event_name,
    (SELECT value.int_value FROM UNNEST(event_params) WHERE key = "score") AS score,
    (SELECT value.string_value FROM UNNEST(event_params) WHERE key = "type_of_game") AS type_of_game
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
    `<dataset>.events_<date>`,
    WHERE
    event.name = "round_completed" )
    event_name = "round_completed" )
    GROUP BY
    type_of_game
    type_of_game

  4. Todd Kerpelman revised this gist Oct 26, 2017. 3 changed files with 30 additions and 35 deletions.
    16 changes: 2 additions & 14 deletions 3_filter_one_event_parameter_by_another.sql
    Original file line number Diff line number Diff line change
    @@ -10,20 +10,8 @@ SELECT
    FROM (
    SELECT
    event.name,
    (
    SELECT
    value.int_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "score") AS score,
    (
    SELECT
    value.string_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "type_of_game") AS type_of_game
    (SELECT value.int_value FROM UNNEST(event.params) WHERE key = "score") AS score,
    (SELECT value.string_value FROM UNNEST(event.params) WHERE key = "type_of_game") AS type_of_game
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
    25 changes: 25 additions & 0 deletions 4_filter_by_range_of_userprop_values.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,25 @@
    #standardSQL

    # Normally in the Firebase console, you can only filter your events by a single user property value. This allows you to
    # filter the property of an event (in this case the "score" value of the "round_completed" event) by a range of user
    # property values

    SELECT
    AVG(score)
    FROM (
    SELECT
    event.name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    WHERE
    xp > 15000
    OR xp < 25000
    24 changes: 3 additions & 21 deletions 5_filter_by_two_user_properties_at_once.sql
    Original file line number Diff line number Diff line change
    @@ -14,27 +14,9 @@ SELECT
    FROM (
    SELECT
    event.name,
    (
    SELECT
    value.int_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "score") AS score,
    (
    SELECT
    value.value.string_value
    FROM
    UNNEST(user_dim.user_properties)
    WHERE
    key = "is_spender") AS spender,
    (
    SELECT
    CAST(value.value.string_value AS int64)
    FROM
    UNNEST(user_dim.user_properties)
    WHERE
    key = "powers") AS powers
    (SELECT value.int_value FROM UNNEST(event.params) WHERE key = "score") AS score,
    (SELECT value.value.string_value FROM UNNEST(user_dim.user_properties) WHERE key = "is_spender") AS spender,
    (SELECT CAST(value.value.string_value AS int64) FROM UNNEST(user_dim.user_properties) WHERE key = "powers") AS powers
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
  5. Todd Kerpelman revised this gist Oct 26, 2017. 1 changed file with 0 additions and 1 deletion.
    1 change: 0 additions & 1 deletion LICENSE
    Original file line number Diff line number Diff line change
    @@ -1,4 +1,3 @@
    KB

    Apache License
    Version 2.0, January 2004
  6. Todd Kerpelman renamed this gist Oct 26, 2017. 1 changed file with 0 additions and 0 deletions.
    File renamed without changes.
  7. Todd Kerpelman revised this gist Oct 26, 2017. 9 changed files with 21 additions and 45 deletions.
    16 changes: 16 additions & 0 deletions 1_analyze_event_param.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,16 @@
    #standardSQL

    # This query will get the average and standard deviation of a "score" parameter that's part of a
    # "round_completed" event. Feel free to replace these values to match events and parameters that are
    # already in your app.

    SELECT
    AVG(param.value.int_value) AS avg_score,
    stddev(param.value.int_value) AS stddev
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    File renamed without changes.
    File renamed without changes.
    6 changes: 5 additions & 1 deletion BigQuery Recipes.md
    Original file line number Diff line number Diff line change
    @@ -2,4 +2,8 @@ A handful of BigQuery SQL queries that you can use to analyze your own Google An
    To find out more about how they work, check out my presentation from the Firebase Developer Conference in
    Amsterdam (video to be added soon).

    The contents of this gist is licensed under the [Apache License, version 2.0](https://www.apache.org/licenses/LICENSE-2.0)
    Note that none of these scripts will work out of the box -- you'll need to update the values in brackets
    with the names of your actual datasets, and you'll most likely also need to replace the names of events
    and event properties with ones that are appropriate for your app.

    The contents of this gist are licensed under the [Apache License, version 2.0](https://www.apache.org/licenses/LICENSE-2.0)
    44 changes: 0 additions & 44 deletions analyze_event_param.sql
    Original file line number Diff line number Diff line change
    @@ -1,44 +0,0 @@
    #standardSQL

    # This query will get the average and standard deviation of a "score" parameter that's part of a
    # "round_completed" event. Feel free to replace these values to match events and parameters that are
    # already in your app.

    SELECT
    AVG(param.value.int_value) AS avg_score,
    stddev(param.value.int_value) AS stddev
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    WHERE
    event.name = "round_completed"
    AND param.key = "score"

    #standardSQL

    # Get the correlation between one event parameter (in this case, the "score" parameter of the
    # "round_completed" event and a user property (in this case, the "xp" user property, converted
    # from a string to an int).

    SELECT
    corr(score, xp)
    FROM (
    SELECT
    event.name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    @ToddKerpelman



    Write
  8. Todd Kerpelman renamed this gist Oct 26, 2017. 1 changed file with 0 additions and 0 deletions.
    File renamed without changes.
  9. Todd Kerpelman revised this gist Oct 26, 2017. 1 changed file with 5 additions and 0 deletions.
    5 changes: 5 additions & 0 deletions _BigQuery Recipes.md
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,5 @@
    A handful of BigQuery SQL queries that you can use to analyze your own Google Analytics for Firebase data.
    To find out more about how they work, check out my presentation from the Firebase Developer Conference in
    Amsterdam (video to be added soon).

    The contents of this gist is licensed under the [Apache License, version 2.0](https://www.apache.org/licenses/LICENSE-2.0)
  10. Todd Kerpelman created this gist Oct 26, 2017.
    203 changes: 203 additions & 0 deletions LICENSE
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,203 @@
    KB

    Apache License
    Version 2.0, January 2004
    http://www.apache.org/licenses/

    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

    1. Definitions.

    "License" shall mean the terms and conditions for use, reproduction,
    and distribution as defined by Sections 1 through 9 of this document.

    "Licensor" shall mean the copyright owner or entity authorized by
    the copyright owner that is granting the License.

    "Legal Entity" shall mean the union of the acting entity and all
    other entities that control, are controlled by, or are under common
    control with that entity. For the purposes of this definition,
    "control" means (i) the power, direct or indirect, to cause the
    direction or management of such entity, whether by contract or
    otherwise, or (ii) ownership of fifty percent (50%) or more of the
    outstanding shares, or (iii) beneficial ownership of such entity.

    "You" (or "Your") shall mean an individual or Legal Entity
    exercising permissions granted by this License.

    "Source" form shall mean the preferred form for making modifications,
    including but not limited to software source code, documentation
    source, and configuration files.

    "Object" form shall mean any form resulting from mechanical
    transformation or translation of a Source form, including but
    not limited to compiled object code, generated documentation,
    and conversions to other media types.

    "Work" shall mean the work of authorship, whether in Source or
    Object form, made available under the License, as indicated by a
    copyright notice that is included in or attached to the work
    (an example is provided in the Appendix below).

    "Derivative Works" shall mean any work, whether in Source or Object
    form, that is based on (or derived from) the Work and for which the
    editorial revisions, annotations, elaborations, or other modifications
    represent, as a whole, an original work of authorship. For the purposes
    of this License, Derivative Works shall not include works that remain
    separable from, or merely link (or bind by name) to the interfaces of,
    the Work and Derivative Works thereof.

    "Contribution" shall mean any work of authorship, including
    the original version of the Work and any modifications or additions
    to that Work or Derivative Works thereof, that is intentionally
    submitted to Licensor for inclusion in the Work by the copyright owner
    or by an individual or Legal Entity authorized to submit on behalf of
    the copyright owner. For the purposes of this definition, "submitted"
    means any form of electronic, verbal, or written communication sent
    to the Licensor or its representatives, including but not limited to
    communication on electronic mailing lists, source code control systems,
    and issue tracking systems that are managed by, or on behalf of, the
    Licensor for the purpose of discussing and improving the Work, but
    excluding communication that is conspicuously marked or otherwise
    designated in writing by the copyright owner as "Not a Contribution."

    "Contributor" shall mean Licensor and any individual or Legal Entity
    on behalf of whom a Contribution has been received by Licensor and
    subsequently incorporated within the Work.

    2. Grant of Copyright License. Subject to the terms and conditions of
    this License, each Contributor hereby grants to You a perpetual,
    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
    copyright license to reproduce, prepare Derivative Works of,
    publicly display, publicly perform, sublicense, and distribute the
    Work and such Derivative Works in Source or Object form.

    3. Grant of Patent License. Subject to the terms and conditions of
    this License, each Contributor hereby grants to You a perpetual,
    worldwide, non-exclusive, no-charge, royalty-free, irrevocable
    (except as stated in this section) patent license to make, have made,
    use, offer to sell, sell, import, and otherwise transfer the Work,
    where such license applies only to those patent claims licensable
    by such Contributor that are necessarily infringed by their
    Contribution(s) alone or by combination of their Contribution(s)
    with the Work to which such Contribution(s) was submitted. If You
    institute patent litigation against any entity (including a
    cross-claim or counterclaim in a lawsuit) alleging that the Work
    or a Contribution incorporated within the Work constitutes direct
    or contributory patent infringement, then any patent licenses
    granted to You under this License for that Work shall terminate
    as of the date such litigation is filed.

    4. Redistribution. You may reproduce and distribute copies of the
    Work or Derivative Works thereof in any medium, with or without
    modifications, and in Source or Object form, provided that You
    meet the following conditions:

    (a) You must give any other recipients of the Work or
    Derivative Works a copy of this License; and

    (b) You must cause any modified files to carry prominent notices
    stating that You changed the files; and

    (c) You must retain, in the Source form of any Derivative Works
    that You distribute, all copyright, patent, trademark, and
    attribution notices from the Source form of the Work,
    excluding those notices that do not pertain to any part of
    the Derivative Works; and

    (d) If the Work includes a "NOTICE" text file as part of its
    distribution, then any Derivative Works that You distribute must
    include a readable copy of the attribution notices contained
    within such NOTICE file, excluding those notices that do not
    pertain to any part of the Derivative Works, in at least one
    of the following places: within a NOTICE text file distributed
    as part of the Derivative Works; within the Source form or
    documentation, if provided along with the Derivative Works; or,
    within a display generated by the Derivative Works, if and
    wherever such third-party notices normally appear. The contents
    of the NOTICE file are for informational purposes only and
    do not modify the License. You may add Your own attribution
    notices within Derivative Works that You distribute, alongside
    or as an addendum to the NOTICE text from the Work, provided
    that such additional attribution notices cannot be construed
    as modifying the License.

    You may add Your own copyright statement to Your modifications and
    may provide additional or different license terms and conditions
    for use, reproduction, or distribution of Your modifications, or
    for any such Derivative Works as a whole, provided Your use,
    reproduction, and distribution of the Work otherwise complies with
    the conditions stated in this License.

    5. Submission of Contributions. Unless You explicitly state otherwise,
    any Contribution intentionally submitted for inclusion in the Work
    by You to the Licensor shall be under the terms and conditions of
    this License, without any additional terms or conditions.
    Notwithstanding the above, nothing herein shall supersede or modify
    the terms of any separate license agreement you may have executed
    with Licensor regarding such Contributions.

    6. Trademarks. This License does not grant permission to use the trade
    names, trademarks, service marks, or product names of the Licensor,
    except as required for reasonable and customary use in describing the
    origin of the Work and reproducing the content of the NOTICE file.

    7. Disclaimer of Warranty. Unless required by applicable law or
    agreed to in writing, Licensor provides the Work (and each
    Contributor provides its Contributions) on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
    implied, including, without limitation, any warranties or conditions
    of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
    PARTICULAR PURPOSE. You are solely responsible for determining the
    appropriateness of using or redistributing the Work and assume any
    risks associated with Your exercise of permissions under this License.

    8. Limitation of Liability. In no event and under no legal theory,
    whether in tort (including negligence), contract, or otherwise,
    unless required by applicable law (such as deliberate and grossly
    negligent acts) or agreed to in writing, shall any Contributor be
    liable to You for damages, including any direct, indirect, special,
    incidental, or consequential damages of any character arising as a
    result of this License or out of the use or inability to use the
    Work (including but not limited to damages for loss of goodwill,
    work stoppage, computer failure or malfunction, or any and all
    other commercial damages or losses), even if such Contributor
    has been advised of the possibility of such damages.

    9. Accepting Warranty or Additional Liability. While redistributing
    the Work or Derivative Works thereof, You may choose to offer,
    and charge a fee for, acceptance of support, warranty, indemnity,
    or other liability obligations and/or rights consistent with this
    License. However, in accepting such obligations, You may act only
    on Your own behalf and on Your sole responsibility, not on behalf
    of any other Contributor, and only if You agree to indemnify,
    defend, and hold each Contributor harmless for any liability
    incurred by, or claims asserted against, such Contributor by reason
    of your accepting any such warranty or additional liability.

    END OF TERMS AND CONDITIONS

    APPENDIX: How to apply the Apache License to your work.

    To apply the Apache License to your work, attach the following
    boilerplate notice, with the fields enclosed by brackets "[]"
    replaced with your own identifying information. (Don't include
    the brackets!) The text should be enclosed in the appropriate
    comment syntax for the file format. We also recommend that a
    file or class name and description of purpose be included on the
    same "printed page" as the copyright notice for easier
    identification within third-party archives.

    Copyright [yyyy] [name of copyright owner]

    Licensed under the Apache License, Version 2.0 (the "License");
    you may not use this file except in compliance with the License.
    You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
    limitations under the License.
    44 changes: 44 additions & 0 deletions analyze_event_param.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,44 @@
    #standardSQL

    # This query will get the average and standard deviation of a "score" parameter that's part of a
    # "round_completed" event. Feel free to replace these values to match events and parameters that are
    # already in your app.

    SELECT
    AVG(param.value.int_value) AS avg_score,
    stddev(param.value.int_value) AS stddev
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    WHERE
    event.name = "round_completed"
    AND param.key = "score"

    #standardSQL

    # Get the correlation between one event parameter (in this case, the "score" parameter of the
    # "round_completed" event and a user property (in this case, the "xp" user property, converted
    # from a string to an int).

    SELECT
    corr(score, xp)
    FROM (
    SELECT
    event.name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    @ToddKerpelman



    Write
    35 changes: 35 additions & 0 deletions closed_funnel_with_time_constraints.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,35 @@
    #standardSQL

    # A closed funnel with time constraints!
    # Count the number of occurrences a user encountered a "start_event" event, and then the number of times
    # they encountered an "end_event" event after pre

    SELECT
    COUNTIF(funnel_start_time IS NOT NULL) AS funnel_begin_count,
    COUNTIF(funnel_end_time - funnel_start_time < 4 * 60 * 60 * 1000 * 1000) AS funnel_end_count
    FROM (
    SELECT
    funnel_start_time,
    LEAD(funnel_end_time, 1) OVER (PARTITION BY app_instance_id ORDER BY event_time) AS funnel_end_time
    FROM (
    SELECT
    event.name,
    IF (event.name = "start_event",
    event.timestamp_micros,
    NULL) AS funnel_start_time,
    IF (event.name = "end_event",
    event.timestamp_micros,
    NULL) AS funnel_end_time,
    user_dim.app_info.app_instance_id,
    event.timestamp_micros AS event_time
    FROM
    `<dataset>.app_events_*`,
    UNNEST(event_dim) AS event
    WHERE
    event.name = "start_event"
    OR event.name = "end_event"
    AND _TABLE_SUFFIX BETWEEN '<date1>'
    AND '<date2>'
    ORDER BY
    app_instance_id,
    event.timestamp_micros ) )
    36 changes: 36 additions & 0 deletions common_screen_patterns.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,36 @@
    #standardSQL

    # Using the new "screen_view" event being tracked by Google Analytics for Firebase, can we figure out what the most
    # common triplets of "screen progressions" are through our app?

    SELECT
    screen_0,
    screen_1,
    screen_2,
    COUNT(*) AS count
    FROM (
    SELECT
    user_dim.app_info.app_instance_id AS app_instance,
    event.timestamp_micros AS event_timestamp,
    param.value.string_value AS screen_0,
    LEAD (param.value.string_value, 1) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS screen_1,
    LEAD (param.value.string_value, 2) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS screen_2
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param
    WHERE
    event.name = "screen_view"
    AND param.key = "firebase_screen_class"
    ORDER BY
    app_instance,
    event_timestamp )
    WHERE
    screen_1 IS NOT NULL
    AND screen_2 IS NOT NULL
    GROUP BY
    screen_0,
    screen_1,
    screen_2
    ORDER BY
    count DESC
    22 changes: 22 additions & 0 deletions coorelate_event_param_and_userprop.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,22 @@
    #standardSQL

    # Get the correlation between one event parameter (in this case, the "score" parameter of the
    # "round_completed" event and a user property (in this case, the "xp" user property, converted
    # from a string to an int).

    SELECT
    corr(score, xp)
    FROM (
    SELECT
    event.name,
    param.value.int_value AS score,
    CAST(user_prop.value.value.string_value AS int64) AS xp
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event,
    UNNEST(event.params) AS param,
    UNNEST(user_dim.user_properties) AS user_prop
    WHERE
    event.name = "round_completed"
    AND param.key = "score"
    AND user_prop.key = "xp" )
    48 changes: 48 additions & 0 deletions filter_by_two_user_properties_at_once.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,48 @@
    # standardSQL

    # Suppose we want a side-by-side comparison of an event parameter (in this case "score") by two different user properties
    # (in this case, is_spender and how many power-ups they have). This is how you'd do it. Note that the case statement
    # at the top isn't really necessary if you have a user property that doesn't have too many values.

    SELECT
    AVG(score) AS avg_score,
    spender,
    CASE
    WHEN powers < 20 THEN 'few_powers'
    ELSE 'many_powers'
    END AS powers_txt
    FROM (
    SELECT
    event.name,
    (
    SELECT
    value.int_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "score") AS score,
    (
    SELECT
    value.value.string_value
    FROM
    UNNEST(user_dim.user_properties)
    WHERE
    key = "is_spender") AS spender,
    (
    SELECT
    CAST(value.value.string_value AS int64)
    FROM
    UNNEST(user_dim.user_properties)
    WHERE
    key = "powers") AS powers
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
    WHERE
    event.name = "round_completed" )
    GROUP BY
    spender,
    powers_txt
    ORDER BY
    spender,
    powers_txt
    33 changes: 33 additions & 0 deletions filter_one_event_parameter_by_another.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,33 @@
    #standardSQL

    # Let's group one event parameter (in this case, the "score" parameter of the round_completed event)
    # with another event parameter (in this case, the "type_of_game" parameter) through the magic of
    # SELECT FROM UNNEST !

    SELECT
    AVG(score),
    MAX(type_of_game)
    FROM (
    SELECT
    event.name,
    (
    SELECT
    value.int_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "score") AS score,
    (
    SELECT
    value.string_value
    FROM
    UNNEST(event.params)
    WHERE
    key = "type_of_game") AS type_of_game
    FROM
    `<dataset>.app_events_<date>`,
    UNNEST(event_dim) AS event
    WHERE
    event.name = "round_completed" )
    GROUP BY
    type_of_game
    33 changes: 33 additions & 0 deletions spend_currency.sql
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,33 @@
    #standardSQL

    # See what trio of events are leading up to a desired event within your app!
    # Make sure you replace "spend_virtual_currency" down near the bottom there with the actual
    # event you're trying to target

    #standardSQL
    SELECT
    s0,
    s1,
    s2,
    COUNT(*) AS count
    FROM (
    SELECT
    user_dim.app_info.app_instance_id AS app_instance,
    event.timestamp_micros AS event_timestamp,
    event.name AS s0,
    LEAD (event.name, 1) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS s1,
    LEAD (event.name, 2) OVER (PARTITION BY user_dim.app_info.app_instance_id ORDER BY event.timestamp_micros) AS s2
    FROM
    `<my_dataset_.app_events_<date>`,
    UNNEST(event_dim) AS event
    ORDER BY
    app_instance,
    event_timestamp )
    WHERE
    s2 = "spend_virtual_currency"
    GROUP BY
    s0,
    s1,
    s2
    ORDER BY
    count DESC