Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Implement 'bigquery.dataset.Dataset'. #1018

Merged
merged 12 commits into from
Jul 28, 2015
1 change: 1 addition & 0 deletions gcloud/bigquery/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -23,3 +23,4 @@

from gcloud.bigquery.client import Client
from gcloud.bigquery.connection import SCOPE
from gcloud.bigquery.dataset import Dataset
12 changes: 12 additions & 0 deletions gcloud/bigquery/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@

from gcloud.client import JSONClient
from gcloud.bigquery.connection import Connection
from gcloud.bigquery.dataset import Dataset


class Client(JSONClient):
Expand All @@ -41,3 +42,14 @@ class Client(JSONClient):
"""

_connection_class = Connection

def dataset(self, name):
"""Construct a dataset bound to this client.

:type name: string
:param name: Name of the dataset.

:rtype: :class:`gcloud.bigquery.dataset.Dataset`
:returns: a new ``Dataset`` instance
"""
return Dataset(name, client=self)
369 changes: 369 additions & 0 deletions gcloud/bigquery/dataset.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,369 @@
# Copyright 2015 Google Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Define API Datasets."""

import datetime

import pytz
import six

from gcloud.exceptions import NotFound


class Dataset(object):
"""Datasets are containers for tables.

See:
https://cloud.google.com/bigquery/docs/reference/v2/datasets

:type name: string
:param name: the name of the dataset

:type client: :class:`gcloud.bigquery.client.Client`
:param client: A client which holds credentials and project configuration
for the dataset (which requires a project).
"""

def __init__(self, name, client):
self.name = name
self._client = client
self._properties = {}

@property
def project(self):
"""Project bound to the dataset.

:rtype: string
:returns: the project (derived from the client).
"""
return self._client.project

@property
def path(self):
"""URL path for the dataset's APIs.

:rtype: string
:returns: the path based on project and dataste name.
"""
return '/projects/%s/datasets/%s' % (self.project, self.name)

@property
def created(self):
"""Datetime at which the dataset was created.

:rtype: ``datetime.datetime``, or ``NoneType``
:returns: the creation time (None until set from the server).
"""
return _datetime_from_prop(self._properties.get('creationTime'))

@property
def dataset_id(self):
"""ID for the dataset resource.

:rtype: string, or ``NoneType``
:returns: the ID (None until set from the server).
"""
return self._properties.get('id')

@property
def etag(self):
"""ETag for the dataset resource.

:rtype: string, or ``NoneType``
:returns: the ETag (None until set from the server).
"""
return self._properties.get('etag')

@property
def modified(self):
"""Datetime at which the dataset was last modified.

:rtype: ``datetime.datetime``, or ``NoneType``
:returns: the modification time (None until set from the server).
"""
return _datetime_from_prop(self._properties.get('lastModifiedTime'))

@property
def self_link(self):
"""URL for the dataset resource.

:rtype: string, or ``NoneType``
:returns: the URL (None until set from the server).
"""
return self._properties.get('selfLink')

@property
def default_table_expiration_ms(self):
"""Default expiration time for tables in the dataset.

:rtype: integer, or ``NoneType``

This comment was marked as spam.

This comment was marked as spam.

:returns: The time in milliseconds, or None (the default).
"""
return self._properties.get('defaultTableExpirationMs')

@default_table_expiration_ms.setter
def default_table_expiration_ms(self, value):
"""Update default expiration time for tables in the dataset.

:type value: integer, or ``NoneType``
:param value: new default time, in milliseconds

:raises: ValueError for invalid value types.
"""

This comment was marked as spam.

This comment was marked as spam.

if not isinstance(value, six.integer_types) and value is not None:
raise ValueError("Pass an integer, or None")
self._properties['defaultTableExpirationMs'] = value

@property
def description(self):
"""Description of the dataset.

:rtype: string, or ``NoneType``
:returns: The description as set by the user, or None (the default).
"""
return self._properties.get('description')

@description.setter
def description(self, value):
"""Update description of the dataset.

:type value: string, or ``NoneType``
:param value: new description

:raises: ValueError for invalid value types.
"""
if not isinstance(value, six.string_types) and value is not None:
raise ValueError("Pass a string, or None")
self._properties['description'] = value

@property
def friendly_name(self):
"""Title of the dataset.

:rtype: string, or ``NoneType``
:returns: The name as set by the user, or None (the default).
"""
return self._properties.get('friendlyName')

@friendly_name.setter
def friendly_name(self, value):
"""Update title of the dataset.

:type value: string, or ``NoneType``
:param value: new title

:raises: ValueError for invalid value types.
"""
if not isinstance(value, six.string_types) and value is not None:
raise ValueError("Pass a string, or None")
self._properties['friendlyName'] = value

@property
def location(self):
"""Location in which the dataset is hosted.

:rtype: string, or ``NoneType``
:returns: The location as set by the user, or None (the default).
"""
return self._properties.get('location')

@location.setter
def location(self, value):
"""Update location in which the dataset is hosted.

:type value: string, or ``NoneType``
:param value: new location

:raises: ValueError for invalid value types.
"""
if not isinstance(value, six.string_types) and value is not None:
raise ValueError("Pass a string, or None")
self._properties['location'] = value

def _require_client(self, client):
"""Check client or verify over-ride.

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.

:rtype: :class:`gcloud.bigquery.client.Client`
:returns: The client passed in or the currently bound client.
"""
if client is None:
client = self._client
return client

def _set_properties(self, api_response):
"""Update properties from resource in body of ``api_response``

:type api_response: httplib2.Response
:param api_response: response returned from an API call
"""
self._properties.clear()
cleaned = api_response.copy()
cleaned['creationTime'] = float(cleaned['creationTime'])

This comment was marked as spam.

This comment was marked as spam.

cleaned['lastModifiedTime'] = float(cleaned['lastModifiedTime'])
self._properties.update(cleaned)

def _build_resource(self):
"""Generate a resource for ``create`` or ``update``."""
resource = {
'datasetReference': {
'projectId': self.project, 'datasetId': self.name},
}
if self.default_table_expiration_ms is not None:
value = self.default_table_expiration_ms
resource['defaultTableExpirationMs'] = value

if self.description is not None:
resource['description'] = self.description

if self.friendly_name is not None:
resource['friendlyName'] = self.friendly_name

if self.location is not None:
resource['location'] = self.location

return resource

def create(self, client=None):
"""API call: create the dataset via a PUT request

See:
https://cloud.google.com/bigquery/reference/rest/v2/tables/insert

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.
"""
client = self._require_client(client)
path = '/projects/%s/datasets' % (self.project,)
api_response = client.connection.api_request(
method='POST', path=path, data=self._build_resource())
self._set_properties(api_response)

def exists(self, client=None):
"""API call: test for the existence of the dataset via a GET request

See
https://cloud.google.com/bigquery/docs/reference/v2/datasets/get

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.
"""
client = self._require_client(client)

try:
client.connection.api_request(method='GET', path=self.path,
query_params={'fields': 'id'})
except NotFound:
return False
else:
return True

def reload(self, client=None):
"""API call: refresh dataset properties via a GET request

See
https://cloud.google.com/bigquery/docs/reference/v2/datasets/get

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.
"""
client = self._require_client(client)

api_response = client.connection.api_request(
method='GET', path=self.path)
self._set_properties(api_response)

def patch(self, client=None, **kw):

This comment was marked as spam.

This comment was marked as spam.

This comment was marked as spam.

This comment was marked as spam.

"""API call: update individual dataset properties via a PATCH request

See
https://cloud.google.com/bigquery/docs/reference/v2/datasets/patch

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.

:type kw: ``dict``
:param kw: properties to be patched.

This comment was marked as spam.

This comment was marked as spam.


:raises: ValueError for invalid value types.
"""
client = self._require_client(client)

partial = {}

if 'default_table_expiration_ms' in kw:
value = kw['default_table_expiration_ms']
if not isinstance(value, six.integer_types) and value is not None:
raise ValueError("Pass an integer, or None")
partial['defaultTableExpirationMs'] = value

if 'description' in kw:
partial['description'] = kw['description']

if 'friendly_name' in kw:
partial['friendlyName'] = kw['friendly_name']

if 'location' in kw:
partial['location'] = kw['location']

api_response = client.connection.api_request(
method='PATCH', path=self.path, data=partial)
self._set_properties(api_response)

def update(self, client=None):
"""API call: update dataset properties via a PUT request

See
https://cloud.google.com/bigquery/docs/reference/v2/datasets/update

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.
"""
client = self._require_client(client)
api_response = client.connection.api_request(
method='PUT', path=self.path, data=self._build_resource())
self._set_properties(api_response)

def delete(self, client=None):
"""API call: delete the dataset via a DELETE request

See:
https://cloud.google.com/bigquery/reference/rest/v2/datasets/delete

:type client: :class:`gcloud.bigquery.client.Client` or ``NoneType``
:param client: the client to use. If not passed, falls back to the
``client`` stored on the current dataset.
"""
client = self._require_client(client)
client.connection.api_request(method='DELETE', path=self.path)


def _datetime_from_prop(value):
"""Convert non-none timestamp to datetime, assuming UTC.

:rtype: ``datetime.datetime``, or ``NoneType``
"""
if value is not None:
# back-end returns timestamps as milliseconds since the epoch
value = datetime.datetime.utcfromtimestamp(value / 1000.0)

This comment was marked as spam.

This comment was marked as spam.

This comment was marked as spam.

This comment was marked as spam.

return value.replace(tzinfo=pytz.utc)
Loading