diff --git a/dlp/risk.py b/dlp/risk.py
new file mode 100644
index 00000000000..2a7007646ab
--- /dev/null
+++ b/dlp/risk.py
@@ -0,0 +1,879 @@
+# Copyright 2017 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Sample app that uses the Data Loss Prevention API to perform risk
+analysis."""
+
+from __future__ import print_function
+
+import argparse
+
+
+def numerical_risk_analysis(project, table_project_id, dataset_id, table_id,
+                            column_name, topic_id, subscription_id,
+                            timeout=300):
+    """Uses the Data Loss Prevention API to compute risk metrics of a column
+    of numerical data in a Google BigQuery table.
+
+    Args:
+        project: The Google Cloud project id to use as a parent resource.
+        table_project_id: The Google Cloud project id where the BigQuery
+            table is stored.
+        dataset_id: The id of the dataset to inspect.
+        table_id: The id of the table to inspect.
+        column_name: The name of the column to compute risk metrics for.
+        topic_id: The name of the Pub/Sub topic to notify once the job
+            completes.
+        subscription_id: The name of the Pub/Sub subscription to use when
+            listening for job completion notifications.
+        timeout: The number of seconds to wait for a response from the API.
+
+    Returns:
+        None; the response from the API is printed to the terminal.
+    """
+
+    # Import the client library.
+    import google.cloud.dlp
+
+    # This sample additionally uses Cloud Pub/Sub to receive results from
+    # potentially long-running operations.
+    import google.cloud.pubsub
+
+    # This sample also uses threading.Event() to wait for the job to finish.
+    import threading
+
+    # Instantiate a client.
+    dlp = google.cloud.dlp.DlpServiceClient()
+
+    # Convert the project id into a full resource id.
+    parent = dlp.project_path(project)
+
+    # Location info of the BigQuery table.
+    source_table = {
+        'project_id': table_project_id,
+        'dataset_id': dataset_id,
+        'table_id': table_id
+    }
+
+    # Tell the API where to send a notification when the job is complete.
+    actions = [{
+        'pub_sub': {'topic': '{}/topics/{}'.format(parent, topic_id)}
+    }]
+
+    # Configure the risk analysis job.
+    # Give the name of the numeric column to compute risk metrics for.
+    risk_job = {
+        'privacy_metric': {
+            'numerical_stats_config': {
+                'field': {
+                    'name': column_name
+                }
+            }
+        },
+        'source_table': source_table,
+        'actions': actions
+    }
+
+    # Call the API to start the risk analysis job.
+    operation = dlp.create_dlp_job(parent, risk_job=risk_job)
+
+    # Create a Pub/Sub client and find the subscription. The subscription is
+    # expected to already be listening to the topic.
+    subscriber = google.cloud.pubsub.SubscriberClient()
+    subscription_path = subscriber.subscription_path(
+        project, subscription_id)
+    subscription = subscriber.subscribe(subscription_path)
+
+    # Set up a callback to acknowledge a message. This closes around an event
+    # so that it can signal that it is done and the main thread can continue.
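+    # (A threading.Event lets the Pub/Sub callback thread signal the main
+    # thread: job_done.wait() below blocks until job_done.set() is called in
+    # the callback, or until the timeout elapses.)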
+    job_done = threading.Event()
+
+    def callback(message):
+        try:
+            if message.attributes['DlpJobName'] == operation.name:
+                # This is the message we're looking for, so acknowledge it.
+                message.ack()
+
+                # Now that the job is done, fetch the results and print them.
+                job = dlp.get_dlp_job(operation.name)
+                results = job.risk_details.numerical_stats_result
+                print('Value Range: [{}, {}]'.format(
+                    results.min_value.integer_value,
+                    results.max_value.integer_value))
+                prev_value = None
+                for percent, result in enumerate(results.quantile_values):
+                    value = result.integer_value
+                    if prev_value != value:
+                        print('Value at {}% quantile: {}'.format(
+                            percent, value))
+                        prev_value = value
+                # Signal to the main thread that we can exit.
+                job_done.set()
+            else:
+                # This is not the message we're looking for.
+                message.drop()
+        except Exception as e:
+            # Because this is executing in a thread, an exception won't be
+            # noted unless we print it manually.
+            print(e)
+            raise
+
+    # Register the callback and wait on the event.
+    subscription.open(callback)
+    finished = job_done.wait(timeout=timeout)
+    if not finished:
+        print('No event received before the timeout. Please verify that the '
+              'subscription provided is subscribed to the topic provided.')
+
+
+def categorical_risk_analysis(project, table_project_id, dataset_id, table_id,
+                              column_name, topic_id, subscription_id,
+                              timeout=300):
+    """Uses the Data Loss Prevention API to compute risk metrics of a column
+    of categorical data in a Google BigQuery table.
+
+    Args:
+        project: The Google Cloud project id to use as a parent resource.
+        table_project_id: The Google Cloud project id where the BigQuery
+            table is stored.
+        dataset_id: The id of the dataset to inspect.
+        table_id: The id of the table to inspect.
+        column_name: The name of the column to compute risk metrics for.
+        topic_id: The name of the Pub/Sub topic to notify once the job
+            completes.
+        subscription_id: The name of the Pub/Sub subscription to use when
+            listening for job completion notifications.
+        timeout: The number of seconds to wait for a response from the API.
+
+    Returns:
+        None; the response from the API is printed to the terminal.
+    """
+
+    # Import the client library.
+    import google.cloud.dlp
+
+    # This sample additionally uses Cloud Pub/Sub to receive results from
+    # potentially long-running operations.
+    import google.cloud.pubsub
+
+    # This sample also uses threading.Event() to wait for the job to finish.
+    import threading
+
+    # Instantiate a client.
+    dlp = google.cloud.dlp.DlpServiceClient()
+
+    # Convert the project id into a full resource id.
+    parent = dlp.project_path(project)
+
+    # Location info of the BigQuery table.
+    source_table = {
+        'project_id': table_project_id,
+        'dataset_id': dataset_id,
+        'table_id': table_id
+    }
+
+    # Tell the API where to send a notification when the job is complete.
+    actions = [{
+        'pub_sub': {'topic': '{}/topics/{}'.format(parent, topic_id)}
+    }]
+
+    # Configure the risk analysis job.
+    # Give the name of the categorical column to compute risk metrics for.
+    risk_job = {
+        'privacy_metric': {
+            'categorical_stats_config': {
+                'field': {
+                    'name': column_name
+                }
+            }
+        },
+        'source_table': source_table,
+        'actions': actions
+    }
+
+    # Call the API to start the risk analysis job.
+    operation = dlp.create_dlp_job(parent, risk_job=risk_job)
+
+    # Create a Pub/Sub client and find the subscription. The subscription is
+    # expected to already be listening to the topic.
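+    # For example, using the names from this sample's tests, the resources
+    # could be created ahead of time with:
+    #   gcloud pubsub topics create dlp-test
+    #   gcloud pubsub subscriptions create dlp-test-subscription \
+    #       --topic dlp-test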
+    subscriber = google.cloud.pubsub.SubscriberClient()
+    subscription_path = subscriber.subscription_path(
+        project, subscription_id)
+    subscription = subscriber.subscribe(subscription_path)
+
+    # Set up a callback to acknowledge a message. This closes around an event
+    # so that it can signal that it is done and the main thread can continue.
+    job_done = threading.Event()
+
+    def callback(message):
+        try:
+            if message.attributes['DlpJobName'] == operation.name:
+                # This is the message we're looking for, so acknowledge it.
+                message.ack()
+
+                # Now that the job is done, fetch the results and print them.
+                job = dlp.get_dlp_job(operation.name)
+                histogram_buckets = (job.risk_details
+                                     .categorical_stats_result
+                                     .value_frequency_histogram_buckets)
+                # Print bucket stats.
+                for i, bucket in enumerate(histogram_buckets):
+                    print('Bucket {}:'.format(i))
+                    print('   Most common value occurs {} time(s)'.format(
+                        bucket.value_frequency_upper_bound))
+                    print('   Least common value occurs {} time(s)'.format(
+                        bucket.value_frequency_lower_bound))
+                    print('   {} unique values total.'.format(
+                        bucket.bucket_size))
+                    for value in bucket.bucket_values:
+                        print('   Value {} occurs {} time(s)'.format(
+                            value.value.integer_value, value.count))
+                # Signal to the main thread that we can exit.
+                job_done.set()
+            else:
+                # This is not the message we're looking for.
+                message.drop()
+        except Exception as e:
+            # Because this is executing in a thread, an exception won't be
+            # noted unless we print it manually.
+            print(e)
+            raise
+
+    # Register the callback and wait on the event.
+    subscription.open(callback)
+    finished = job_done.wait(timeout=timeout)
+    if not finished:
+        print('No event received before the timeout. Please verify that the '
+              'subscription provided is subscribed to the topic provided.')
+
+
+def k_anonymity_analysis(project, table_project_id, dataset_id, table_id,
+                         topic_id, subscription_id, quasi_ids, timeout=300):
+    """Uses the Data Loss Prevention API to compute the k-anonymity of a
+    column set in a Google BigQuery table.
+
+    Args:
+        project: The Google Cloud project id to use as a parent resource.
+        table_project_id: The Google Cloud project id where the BigQuery
+            table is stored.
+        dataset_id: The id of the dataset to inspect.
+        table_id: The id of the table to inspect.
+        topic_id: The name of the Pub/Sub topic to notify once the job
+            completes.
+        subscription_id: The name of the Pub/Sub subscription to use when
+            listening for job completion notifications.
+        quasi_ids: A set of columns that form a composite key.
+        timeout: The number of seconds to wait for a response from the API.
+
+    Returns:
+        None; the response from the API is printed to the terminal.
+    """
+
+    # Import the client library.
+    import google.cloud.dlp
+
+    # This sample additionally uses Cloud Pub/Sub to receive results from
+    # potentially long-running operations.
+    import google.cloud.pubsub
+
+    # This sample also uses threading.Event() to wait for the job to finish.
+    import threading
+
+    # Instantiate a client.
+    dlp = google.cloud.dlp.DlpServiceClient()
+
+    # Convert the project id into a full resource id.
+    parent = dlp.project_path(project)
+
+    # Location info of the BigQuery table.
+    source_table = {
+        'project_id': table_project_id,
+        'dataset_id': dataset_id,
+        'table_id': table_id
+    }
+
+    # Convert the quasi-id list to the Protobuf field type. list() is used
+    # so the result behaves the same on Python 2 and 3, where map() returns
+    # a lazy iterator.
+    def map_fields(field):
+        return {'name': field}
+
+    quasi_ids = list(map(map_fields, quasi_ids))
+
+    # Tell the API where to send a notification when the job is complete.
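+    # 'parent' is already of the form 'projects/<project-id>', so the
+    # formatted string below is the topic's full resource name:
+    # 'projects/<project-id>/topics/<topic-id>'.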
+    actions = [{
+        'pub_sub': {'topic': '{}/topics/{}'.format(parent, topic_id)}
+    }]
+
+    # Configure the risk analysis job.
+    # Give the names of the quasi-identifier columns to compute k-anonymity
+    # over.
+    risk_job = {
+        'privacy_metric': {
+            'k_anonymity_config': {
+                'quasi_ids': quasi_ids
+            }
+        },
+        'source_table': source_table,
+        'actions': actions
+    }
+
+    # Call the API to start the risk analysis job.
+    operation = dlp.create_dlp_job(parent, risk_job=risk_job)
+
+    # Create a Pub/Sub client and find the subscription. The subscription is
+    # expected to already be listening to the topic.
+    subscriber = google.cloud.pubsub.SubscriberClient()
+    subscription_path = subscriber.subscription_path(
+        project, subscription_id)
+    subscription = subscriber.subscribe(subscription_path)
+
+    # Set up a callback to acknowledge a message. This closes around an event
+    # so that it can signal that it is done and the main thread can continue.
+    job_done = threading.Event()
+
+    # Create a helper function for unpacking values.
+    def get_values(obj):
+        return int(obj.integer_value)
+
+    def callback(message):
+        try:
+            if message.attributes['DlpJobName'] == operation.name:
+                # This is the message we're looking for, so acknowledge it.
+                message.ack()
+
+                # Now that the job is done, fetch the results and print them.
+                job = dlp.get_dlp_job(operation.name)
+                histogram_buckets = (job.risk_details
+                                     .k_anonymity_result
+                                     .equivalence_class_histogram_buckets)
+                # Print bucket stats.
+                for i, bucket in enumerate(histogram_buckets):
+                    print('Bucket {}:'.format(i))
+                    if bucket.equivalence_class_size_lower_bound:
+                        print('   Bucket size range: [{}, {}]'.format(
+                            bucket.equivalence_class_size_lower_bound,
+                            bucket.equivalence_class_size_upper_bound))
+                    for value_bucket in bucket.bucket_values:
+                        # list() materializes the map so the values, not a
+                        # map object, are printed on Python 3.
+                        print('   Quasi-ID values: {}'.format(
+                            list(map(get_values,
+                                     value_bucket.quasi_ids_values))))
+                        print('   Class size: {}'.format(
+                            value_bucket.equivalence_class_size))
+                # Signal to the main thread that we can exit.
+                job_done.set()
+            else:
+                # This is not the message we're looking for.
+                message.drop()
+        except Exception as e:
+            # Because this is executing in a thread, an exception won't be
+            # noted unless we print it manually.
+            print(e)
+            raise
+
+    # Register the callback and wait on the event.
+    subscription.open(callback)
+    finished = job_done.wait(timeout=timeout)
+    if not finished:
+        print('No event received before the timeout. Please verify that the '
+              'subscription provided is subscribed to the topic provided.')
+
+
+def l_diversity_analysis(project, table_project_id, dataset_id, table_id,
+                         topic_id, subscription_id, sensitive_attribute,
+                         quasi_ids, timeout=300):
+    """Uses the Data Loss Prevention API to compute the l-diversity of a
+    column set in a Google BigQuery table.
+
+    Args:
+        project: The Google Cloud project id to use as a parent resource.
+        table_project_id: The Google Cloud project id where the BigQuery
+            table is stored.
+        dataset_id: The id of the dataset to inspect.
+        table_id: The id of the table to inspect.
+        topic_id: The name of the Pub/Sub topic to notify once the job
+            completes.
+        subscription_id: The name of the Pub/Sub subscription to use when
+            listening for job completion notifications.
+        sensitive_attribute: The column to measure l-diversity relative to.
+        quasi_ids: A set of columns that form a composite key.
+        timeout: The number of seconds to wait for a response from the API.
+
+    Returns:
+        None; the response from the API is printed to the terminal.
+    """
+
+    # Import the client library.
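+    # (As in the samples above, imports are kept inside the function so that
+    # each sample reads as a self-contained snippet.)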
+    import google.cloud.dlp
+
+    # This sample additionally uses Cloud Pub/Sub to receive results from
+    # potentially long-running operations.
+    import google.cloud.pubsub
+
+    # This sample also uses threading.Event() to wait for the job to finish.
+    import threading
+
+    # Instantiate a client.
+    dlp = google.cloud.dlp.DlpServiceClient()
+
+    # Convert the project id into a full resource id.
+    parent = dlp.project_path(project)
+
+    # Location info of the BigQuery table.
+    source_table = {
+        'project_id': table_project_id,
+        'dataset_id': dataset_id,
+        'table_id': table_id
+    }
+
+    # Convert the quasi-id list to the Protobuf field type.
+    def map_fields(field):
+        return {'name': field}
+
+    quasi_ids = list(map(map_fields, quasi_ids))
+
+    # Tell the API where to send a notification when the job is complete.
+    actions = [{
+        'pub_sub': {'topic': '{}/topics/{}'.format(parent, topic_id)}
+    }]
+
+    # Configure the risk analysis job.
+    # Give the names of the quasi-identifier columns and the sensitive
+    # attribute to compute l-diversity for.
+    risk_job = {
+        'privacy_metric': {
+            'l_diversity_config': {
+                'quasi_ids': quasi_ids,
+                'sensitive_attribute': {
+                    'name': sensitive_attribute
+                }
+            }
+        },
+        'source_table': source_table,
+        'actions': actions
+    }
+
+    # Call the API to start the risk analysis job.
+    operation = dlp.create_dlp_job(parent, risk_job=risk_job)
+
+    # Create a Pub/Sub client and find the subscription. The subscription is
+    # expected to already be listening to the topic.
+    subscriber = google.cloud.pubsub.SubscriberClient()
+    subscription_path = subscriber.subscription_path(
+        project, subscription_id)
+    subscription = subscriber.subscribe(subscription_path)
+
+    # Set up a callback to acknowledge a message. This closes around an event
+    # so that it can signal that it is done and the main thread can continue.
+    job_done = threading.Event()
+
+    # Create a helper function for unpacking values.
+    def get_values(obj):
+        return int(obj.integer_value)
+
+    def callback(message):
+        try:
+            if message.attributes['DlpJobName'] == operation.name:
+                # This is the message we're looking for, so acknowledge it.
+                message.ack()
+
+                # Now that the job is done, fetch the results and print them.
+                job = dlp.get_dlp_job(operation.name)
+                histogram_buckets = (
+                    job.risk_details
+                    .l_diversity_result
+                    .sensitive_value_frequency_histogram_buckets)
+                # Print bucket stats.
+                for i, bucket in enumerate(histogram_buckets):
+                    print('Bucket {}:'.format(i))
+                    print('   Bucket size range: [{}, {}]'.format(
+                        bucket.sensitive_value_frequency_lower_bound,
+                        bucket.sensitive_value_frequency_upper_bound))
+                    for value_bucket in bucket.bucket_values:
+                        print('   Quasi-ID values: {}'.format(
+                            list(map(get_values,
+                                     value_bucket.quasi_ids_values))))
+                        print('   Class size: {}'.format(
+                            value_bucket.equivalence_class_size))
+                        for value in value_bucket.top_sensitive_values:
+                            print('   Sensitive value {} occurs {} time(s)'
+                                  .format(value.value, value.count))
+                # Signal to the main thread that we can exit.
+                job_done.set()
+            else:
+                # This is not the message we're looking for.
+                message.drop()
+        except Exception as e:
+            # Because this is executing in a thread, an exception won't be
+            # noted unless we print it manually.
+            print(e)
+            raise
+
+    # Register the callback and wait on the event.
+    subscription.open(callback)
+    finished = job_done.wait(timeout=timeout)
+    if not finished:
+        print('No event received before the timeout. Please verify that the '
+              'subscription provided is subscribed to the topic provided.')
+
+
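+# k-map estimation compares the table's quasi-identifier values against a
+# statistical model of the population (selected via infoTypes) to estimate
+# how many people are likely to share each combination of values.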
+def k_map_estimate_analysis(project, table_project_id, dataset_id, table_id,
+                            topic_id, subscription_id, quasi_ids, info_types,
+                            region_code='US', timeout=300):
+    """Uses the Data Loss Prevention API to compute the k-map risk estimation
+    of a column set in a Google BigQuery table.
+
+    Args:
+        project: The Google Cloud project id to use as a parent resource.
+        table_project_id: The Google Cloud project id where the BigQuery
+            table is stored.
+        dataset_id: The id of the dataset to inspect.
+        table_id: The id of the table to inspect.
+        topic_id: The name of the Pub/Sub topic to notify once the job
+            completes.
+        subscription_id: The name of the Pub/Sub subscription to use when
+            listening for job completion notifications.
+        quasi_ids: A set of columns that form a composite key, optionally
+            with their reidentification distributions.
+        info_types: The infoType corresponding to each quasi-id, used to
+            select a statistical model of the population.
+        region_code: The ISO 3166-1 region code that the data is
+            representative of. Can be omitted if using a region-specific
+            infoType (such as US_ZIP_5).
+        timeout: The number of seconds to wait for a response from the API.
+
+    Returns:
+        None; the response from the API is printed to the terminal.
+    """
+
+    # Import the client library.
+    import google.cloud.dlp
+
+    # This sample additionally uses Cloud Pub/Sub to receive results from
+    # potentially long-running operations.
+    import google.cloud.pubsub
+
+    # This sample also uses threading.Event() to wait for the job to finish.
+    import threading
+
+    # Instantiate a client.
+    dlp = google.cloud.dlp.DlpServiceClient()
+
+    # Convert the project id into a full resource id.
+    parent = dlp.project_path(project)
+
+    # Location info of the BigQuery table.
+    source_table = {
+        'project_id': table_project_id,
+        'dataset_id': dataset_id,
+        'table_id': table_id
+    }
+
+    # Check that the number of quasi-ids equals the number of infoTypes.
+    if len(quasi_ids) != len(info_types):
+        raise ValueError(
+            'Number of infoTypes and number of quasi-identifiers must be '
+            'equal!')
+
+    # Convert the quasi-id list to the Protobuf field type, pairing each
+    # quasi-id with its infoType.
+    def map_fields(quasi_id, info_type):
+        return {'field': {'name': quasi_id}, 'info_type': {'name': info_type}}
+
+    quasi_ids = list(map(map_fields, quasi_ids, info_types))
+
+    # Tell the API where to send a notification when the job is complete.
+    actions = [{
+        'pub_sub': {'topic': '{}/topics/{}'.format(parent, topic_id)}
+    }]
+
+    # Configure the risk analysis job.
+    # Give the quasi-identifiers (paired with their infoTypes) and the
+    # region code to estimate k-map values for.
+    risk_job = {
+        'privacy_metric': {
+            'k_map_estimation_config': {
+                'quasi_ids': quasi_ids,
+                'region_code': region_code
+            }
+        },
+        'source_table': source_table,
+        'actions': actions
+    }
+
+    # Call the API to start the risk analysis job.
+    operation = dlp.create_dlp_job(parent, risk_job=risk_job)
+
+    # Create a Pub/Sub client and find the subscription. The subscription is
+    # expected to already be listening to the topic.
+    subscriber = google.cloud.pubsub.SubscriberClient()
+    subscription_path = subscriber.subscription_path(
+        project, subscription_id)
+    subscription = subscriber.subscribe(subscription_path)
+
+    # Set up a callback to acknowledge a message. This closes around an event
+    # so that it can signal that it is done and the main thread can continue.
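+    # The result is a histogram of estimated anonymity: each bucket covers a
+    # range [min_anonymity, max_anonymity] and lists sample quasi-id values.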
+    job_done = threading.Event()
+
+    # Create a helper function for unpacking values.
+    def get_values(obj):
+        return int(obj.integer_value)
+
+    def callback(message):
+        try:
+            if message.attributes['DlpJobName'] == operation.name:
+                # This is the message we're looking for, so acknowledge it.
+                message.ack()
+
+                # Now that the job is done, fetch the results and print them.
+                job = dlp.get_dlp_job(operation.name)
+                histogram_buckets = (job.risk_details
+                                     .k_map_estimation_result
+                                     .k_map_estimation_histogram)
+                # Print bucket stats.
+                for i, bucket in enumerate(histogram_buckets):
+                    print('Bucket {}:'.format(i))
+                    print('   Anonymity range: [{}, {}]'.format(
+                        bucket.min_anonymity, bucket.max_anonymity))
+                    print('   Size: {}'.format(bucket.bucket_size))
+                    for value_bucket in bucket.bucket_values:
+                        print('   Values: {}'.format(
+                            list(map(get_values,
+                                     value_bucket.quasi_ids_values))))
+                        print('   Estimated k-map anonymity: {}'.format(
+                            value_bucket.estimated_anonymity))
+                # Signal to the main thread that we can exit.
+                job_done.set()
+            else:
+                # This is not the message we're looking for.
+                message.drop()
+        except Exception as e:
+            # Because this is executing in a thread, an exception won't be
+            # noted unless we print it manually.
+            print(e)
+            raise
+
+    # Register the callback and wait on the event.
+    subscription.open(callback)
+    finished = job_done.wait(timeout=timeout)
+    if not finished:
+        print('No event received before the timeout. Please verify that the '
+              'subscription provided is subscribed to the topic provided.')
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser(description=__doc__)
+    subparsers = parser.add_subparsers(
+        dest='content', help='Select which risk analysis to perform.')
+    subparsers.required = True
+
+    numerical_parser = subparsers.add_parser(
+        'numerical',
+        help='Computes risk metrics of a column of numerical data in a '
+             'Google BigQuery table.')
+    numerical_parser.add_argument(
+        'project',
+        help='The Google Cloud project id to use as a parent resource.')
+    numerical_parser.add_argument(
+        'table_project_id',
+        help='The Google Cloud project id where the BigQuery table is stored.')
+    numerical_parser.add_argument(
+        'dataset_id',
+        help='The id of the dataset to inspect.')
+    numerical_parser.add_argument(
+        'table_id',
+        help='The id of the table to inspect.')
+    numerical_parser.add_argument(
+        'column_name',
+        help='The name of the column to compute risk metrics for.')
+    numerical_parser.add_argument(
+        'topic_id',
+        help='The name of the Pub/Sub topic to notify once the job completes.')
+    numerical_parser.add_argument(
+        'subscription_id',
+        help='The name of the Pub/Sub subscription to use when listening for '
+             'job completion notifications.')
+    numerical_parser.add_argument(
+        '--timeout', type=int, default=300,
+        help='The number of seconds to wait for a response from the API.')
+
+    categorical_parser = subparsers.add_parser(
+        'categorical',
+        help='Computes risk metrics of a column of categorical data in a '
+             'Google BigQuery table.')
+    categorical_parser.add_argument(
+        'project',
+        help='The Google Cloud project id to use as a parent resource.')
+    categorical_parser.add_argument(
+        'table_project_id',
+        help='The Google Cloud project id where the BigQuery table is stored.')
+    categorical_parser.add_argument(
+        'dataset_id',
+        help='The id of the dataset to inspect.')
+    categorical_parser.add_argument(
+        'table_id',
+        help='The id of the table to inspect.')
+    categorical_parser.add_argument(
+        'column_name',
+        help='The name of the column to compute risk metrics for.')
+    categorical_parser.add_argument(
+        'topic_id',
+        help='The name of the Pub/Sub topic to notify once the job completes.')
+    categorical_parser.add_argument(
+        'subscription_id',
+        help='The name of the Pub/Sub subscription to use when listening for '
+             'job completion notifications.')
+    categorical_parser.add_argument(
+        '--timeout', type=int, default=300,
+        help='The number of seconds to wait for a response from the API.')
+
+    k_anonymity_parser = subparsers.add_parser(
+        'k_anonymity',
+        help='Computes the k-anonymity of a column set in a Google BigQuery '
+             'table.')
+    k_anonymity_parser.add_argument(
+        'project',
+        help='The Google Cloud project id to use as a parent resource.')
+    k_anonymity_parser.add_argument(
+        'table_project_id',
+        help='The Google Cloud project id where the BigQuery table is stored.')
+    k_anonymity_parser.add_argument(
+        'dataset_id',
+        help='The id of the dataset to inspect.')
+    k_anonymity_parser.add_argument(
+        'table_id',
+        help='The id of the table to inspect.')
+    k_anonymity_parser.add_argument(
+        'topic_id',
+        help='The name of the Pub/Sub topic to notify once the job completes.')
+    k_anonymity_parser.add_argument(
+        'subscription_id',
+        help='The name of the Pub/Sub subscription to use when listening for '
+             'job completion notifications.')
+    k_anonymity_parser.add_argument(
+        'quasi_ids', nargs='+',
+        help='A set of columns that form a composite key.')
+    k_anonymity_parser.add_argument(
+        '--timeout', type=int, default=300,
+        help='The number of seconds to wait for a response from the API.')
+
+    l_diversity_parser = subparsers.add_parser(
+        'l_diversity',
+        help='Computes the l-diversity of a column set in a Google BigQuery '
+             'table.')
+    l_diversity_parser.add_argument(
+        'project',
+        help='The Google Cloud project id to use as a parent resource.')
+    l_diversity_parser.add_argument(
+        'table_project_id',
+        help='The Google Cloud project id where the BigQuery table is stored.')
+    l_diversity_parser.add_argument(
+        'dataset_id',
+        help='The id of the dataset to inspect.')
+    l_diversity_parser.add_argument(
+        'table_id',
+        help='The id of the table to inspect.')
+    l_diversity_parser.add_argument(
+        'topic_id',
+        help='The name of the Pub/Sub topic to notify once the job completes.')
+    l_diversity_parser.add_argument(
+        'subscription_id',
+        help='The name of the Pub/Sub subscription to use when listening for '
+             'job completion notifications.')
+    l_diversity_parser.add_argument(
+        'sensitive_attribute',
+        help='The column to measure l-diversity relative to.')
+    l_diversity_parser.add_argument(
+        'quasi_ids', nargs='+',
+        help='A set of columns that form a composite key.')
+    l_diversity_parser.add_argument(
+        '--timeout', type=int, default=300,
+        help='The number of seconds to wait for a response from the API.')
+
+    k_map_parser = subparsers.add_parser(
+        'k_map',
+        help='Computes the k-map risk estimation of a column set in a Google '
+             'BigQuery table.')
+    k_map_parser.add_argument(
+        'project',
+        help='The Google Cloud project id to use as a parent resource.')
+    k_map_parser.add_argument(
+        'table_project_id',
+        help='The Google Cloud project id where the BigQuery table is stored.')
+    k_map_parser.add_argument(
+        'dataset_id',
+        help='The id of the dataset to inspect.')
+    k_map_parser.add_argument(
+        'table_id',
+        help='The id of the table to inspect.')
+    k_map_parser.add_argument(
+        'topic_id',
+        help='The name of the Pub/Sub topic to notify once the job completes.')
+    k_map_parser.add_argument(
+        'subscription_id',
+        help='The name of the Pub/Sub subscription to use when listening for '
+             'job completion notifications.')
+    k_map_parser.add_argument(
+        'quasi_ids', nargs='+',
+        help='A set of columns that form a composite key.')
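+    # Note: exactly one --info-types entry must be supplied per quasi-id;
+    # k_map_estimate_analysis() raises a ValueError otherwise.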
+    k_map_parser.add_argument(
+        '-t', '--info-types', nargs='+',
+        help='The infoType for each quasi-id, used to provide a statistical '
+             'model of the population.',
+        required=True)
+    k_map_parser.add_argument(
+        '-r', '--region-code', default='US',
+        help='The ISO 3166-1 region code that the data is representative of.')
+    k_map_parser.add_argument(
+        '--timeout', type=int, default=300,
+        help='The number of seconds to wait for a response from the API.')
+
+    args = parser.parse_args()
+
+    if args.content == 'numerical':
+        numerical_risk_analysis(
+            args.project,
+            args.table_project_id,
+            args.dataset_id,
+            args.table_id,
+            args.column_name,
+            args.topic_id,
+            args.subscription_id,
+            timeout=args.timeout)
+    elif args.content == 'categorical':
+        categorical_risk_analysis(
+            args.project,
+            args.table_project_id,
+            args.dataset_id,
+            args.table_id,
+            args.column_name,
+            args.topic_id,
+            args.subscription_id,
+            timeout=args.timeout)
+    elif args.content == 'k_anonymity':
+        k_anonymity_analysis(
+            args.project,
+            args.table_project_id,
+            args.dataset_id,
+            args.table_id,
+            args.topic_id,
+            args.subscription_id,
+            args.quasi_ids,
+            timeout=args.timeout)
+    elif args.content == 'l_diversity':
+        l_diversity_analysis(
+            args.project,
+            args.table_project_id,
+            args.dataset_id,
+            args.table_id,
+            args.topic_id,
+            args.subscription_id,
+            args.sensitive_attribute,
+            args.quasi_ids,
+            timeout=args.timeout)
+    elif args.content == 'k_map':
+        k_map_estimate_analysis(
+            args.project,
+            args.table_project_id,
+            args.dataset_id,
+            args.table_id,
+            args.topic_id,
+            args.subscription_id,
+            args.quasi_ids,
+            args.info_types,
+            region_code=args.region_code,
+            timeout=args.timeout)
diff --git a/dlp/risk_test.py b/dlp/risk_test.py
new file mode 100644
index 00000000000..8fdb5c9e7bb
--- /dev/null
+++ b/dlp/risk_test.py
@@ -0,0 +1,224 @@
+# Copyright 2017 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the 'License');
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an 'AS IS' BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+
+import google.api_core.exceptions
+import google.cloud.pubsub
+
+import pytest
+
+import risk
+
+GCLOUD_PROJECT = os.getenv('GCLOUD_PROJECT')
+TOPIC_ID = 'dlp-test'
+SUBSCRIPTION_ID = 'dlp-test-subscription'
+DATASET_ID = 'integration_tests_dlp'
+UNIQUE_FIELD = 'Name'
+REPEATED_FIELD = 'Mystery'
+NUMERIC_FIELD = 'Age'
+STRING_BOOLEAN_FIELD = 'Gender'
+
+
+# Create a new custom topic/subscription.
+@pytest.fixture(scope='module')
+def topic_id():
+    # Creates a pubsub topic, and tears it down.
+    publisher = google.cloud.pubsub.PublisherClient()
+    topic_path = publisher.topic_path(GCLOUD_PROJECT, TOPIC_ID)
+    try:
+        publisher.create_topic(topic_path)
+    except google.api_core.exceptions.AlreadyExists:
+        pass
+
+    yield TOPIC_ID
+
+    publisher.delete_topic(topic_path)
+
+
+@pytest.fixture(scope='module')
+def subscription_id(topic_id):
+    # Subscribes to a topic.
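+    # Creating the subscription is effectively idempotent: an AlreadyExists
+    # error simply means a previous run left it in place.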
+ subscriber = google.cloud.pubsub.SubscriberClient() + topic_path = subscriber.topic_path(GCLOUD_PROJECT, topic_id) + subscription_path = subscriber.subscription_path( + GCLOUD_PROJECT, SUBSCRIPTION_ID) + try: + subscriber.create_subscription(subscription_path, topic_path) + except google.api_core.exceptions.AlreadyExists: + pass + + yield SUBSCRIPTION_ID + + subscriber.delete_subscription(subscription_path) + + +def test_numerical_risk_analysis(topic_id, subscription_id, capsys): + risk.numerical_risk_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + NUMERIC_FIELD, + topic_id, + subscription_id) + + out, _ = capsys.readouterr() + assert 'Value Range:' in out + + +def test_categorical_risk_analysis_on_string_field( + topic_id, subscription_id, capsys): + risk.categorical_risk_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + UNIQUE_FIELD, + topic_id, + subscription_id, timeout=180) + + out, _ = capsys.readouterr() + assert 'Most common value occurs' in out + + +def test_categorical_risk_analysis_on_number_field( + topic_id, subscription_id, capsys): + + risk.categorical_risk_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + NUMERIC_FIELD, + topic_id, + subscription_id) + + out, _ = capsys.readouterr() + assert 'Most common value occurs' in out + + +def test_k_anonymity_analysis_single_field(topic_id, subscription_id, capsys): + risk.k_anonymity_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + [NUMERIC_FIELD]) + + out, _ = capsys.readouterr() + assert 'Quasi-ID values:' in out + assert 'Class size:' in out + + +def test_k_anonymity_analysis_multiple_fields(topic_id, subscription_id, + capsys): + risk.k_anonymity_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + [NUMERIC_FIELD, REPEATED_FIELD]) + + out, _ = capsys.readouterr() + assert 'Quasi-ID values:' in out + assert 'Class size:' in out + + +def test_l_diversity_analysis_single_field(topic_id, subscription_id, capsys): + risk.l_diversity_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + UNIQUE_FIELD, + [NUMERIC_FIELD]) + + out, _ = capsys.readouterr() + assert 'Quasi-ID values:' in out + assert 'Class size:' in out + assert 'Sensitive value' in out + + +def test_l_diversity_analysis_multiple_field( + topic_id, subscription_id, capsys): + risk.l_diversity_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + UNIQUE_FIELD, + [NUMERIC_FIELD, REPEATED_FIELD]) + + out, _ = capsys.readouterr() + assert 'Quasi-ID values:' in out + assert 'Class size:' in out + assert 'Sensitive value' in out + + +def test_k_map_estimate_analysis_single_field( + topic_id, subscription_id, capsys): + risk.k_map_estimate_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + [NUMERIC_FIELD], + ['AGE']) + + out, _ = capsys.readouterr() + assert 'Anonymity range:' in out + assert 'Size:' in out + assert 'Values' in out + + +def test_k_map_estimate_analysis_multiple_field( + topic_id, subscription_id, capsys): + risk.k_map_estimate_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + [NUMERIC_FIELD, STRING_BOOLEAN_FIELD], + ['AGE', 'GENDER']) + + out, _ = capsys.readouterr() + assert 'Anonymity range:' in out + assert 'Size:' in out + assert 'Values' in out + + +def 
test_k_map_estimate_analysis_quasi_ids_info_types_equal( + topic_id, subscription_id): + with pytest.raises(ValueError): + risk.k_map_estimate_analysis( + GCLOUD_PROJECT, + GCLOUD_PROJECT, + DATASET_ID, + 'harmful', + topic_id, + subscription_id, + [NUMERIC_FIELD, STRING_BOOLEAN_FIELD], + ['AGE'])