#1. Install Dependencies
First install the libraries needed to execute recipes. This only needs to be done once; then click play.


In [ ]:
# Install StarThinker straight from its GitHub repository. The leading "!" makes
# the notebook run this line as a shell command rather than as Python.
!pip install git+https://github.com/google/starthinker


#2. Get Cloud Project ID
Running this recipe [requires a Google Cloud Project](https://github.com/google/starthinker/blob/master/tutorials/cloud_project.md). This only needs to be done once; then click play.


In [ ]:
# Google Cloud project ID for this recipe; replace the placeholder before running.
CLOUD_PROJECT = 'PASTE PROJECT ID HERE'

# Echo the value so the cell output confirms what was set.
print("Cloud Project Set To: %s" % (CLOUD_PROJECT,))


#3. Get Client Credentials
Reading from and writing to various endpoints requires [downloading client credentials](https://github.com/google/starthinker/blob/master/tutorials/cloud_client_installed.md). This only needs to be done once; then click play.


In [ ]:
# Client credentials for this recipe; replace the placeholder before running.
CLIENT_CREDENTIALS = 'PASTE CREDENTIALS HERE'

# Echo the value so the cell output confirms what was set.
print("Client Credentials Set To: %s" % (CLIENT_CREDENTIALS,))


#4. Enter CM To BigQuery Parameters
Move an existing CM report into a BigQuery table.
 1. Specify an account id.
 1. Specify either report name or report id to move a report.
 1. The most recent valid file will overwrite the table.
 1. Schema is pulled from the official CM specification.
Modify the values below for your use case. This can be done multiple times; then click play.


In [ ]:
# User-editable recipe parameters: change the values, keep the keys.
FIELDS = {
  # Credentials used for reading data.
  'auth_read': 'user',
  # Credentials used for writing data.
  'auth_write': 'service',
  # CM network id.
  'account': '',
  # CM report id, empty if using name instead.
  'report_id': '',
  # CM report name, empty if using id instead.
  'report_name': '',
  # Dataset to be written to in BigQuery.
  'dataset': '',
  # Table to be written to in BigQuery.
  'table': '',
  # Clear data in destination table during this report's time period,
  # then append report data to existing table.
  'is_incremental_load': False,
}

# Echo the parameters so the cell output confirms what was set.
print("Parameters Set To: %s" % (FIELDS,))


#5. Execute CM To BigQuery
This does NOT need to be modified unless you are changing the recipe; just click play.


In [ ]:
from starthinker.util.project import project
from starthinker.script.parse import json_set_fields

# Path handed to project.initialize() as `_user` further down; presumably where
# the user credential file lives in the Colab runtime — confirm.
USER_CREDENTIALS = '/content/user.json'

def _field(name, kind, order, default, description):
  """Return a {'field': {...}} placeholder describing one recipe parameter.

  The notebook later passes TASKS and FIELDS to json_set_fields(); presumably
  that call swaps each placeholder for the FIELDS value stored under `name`
  (confirm against the StarThinker source).
  """
  return {
    'field': {
      'name': name,
      'kind': kind,
      'order': order,
      'default': default,
      'description': description,
    }
  }


# One 'dcm' task: 'report' selects the CM report, 'out' -> 'bigquery' names the
# destination dataset and table.
TASKS = [
  {
    'dcm': {
      'auth': 'user',
      'report': {
        'account': _field('account', 'integer', 2, '', 'CM network id.'),
        'report_id': _field('report_id', 'integer', 3, '', 'CM report id, empty if using name .'),
        'name': _field('report_name', 'string', 4, '', 'CM report name, empty if using id instead.'),
      },
      'out': {
        'bigquery': {
          'auth': 'user',
          'dataset': _field('dataset', 'string', 5, '', 'Dataset to be written to in BigQuery.'),
          'table': _field('table', 'string', 6, '', 'Table to be written to in BigQuery.'),
          'is_incremental_load': _field(
            'is_incremental_load',
            'boolean',
            7,
            False,
            "Clear data in destination table during this report's time period, then append report data to existing table.",
          ),
        }
      }
    }
  }
]

# Apply the user-supplied FIELDS to TASKS. The return value is not used, so the
# substitution presumably happens in place on TASKS — confirm.
json_set_fields(TASKS, FIELDS)

# Hand the recipe, cloud project and credentials to StarThinker, then run it.
project.initialize(
  _recipe={'tasks': TASKS},
  _project=CLOUD_PROJECT,
  _user=USER_CREDENTIALS,
  _client=CLIENT_CREDENTIALS,
  _verbose=True,
  _force=True,
)
project.execute(_force=True)
