Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

BigQuery: Add ORC format support for load jobs, missing bigtable support. #3391

Merged
merged 8 commits into from
Jun 19, 2018
Original file line number Diff line number Diff line change
@@ -0,0 +1,203 @@
/*
* Copyright 2018 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.google.cloud.bigquery;


import com.google.common.base.Function;
import com.google.common.base.MoreObjects;
import java.io.Serializable;
import java.util.Objects;

public class BigtableColumn implements Serializable {


static final Function<com.google.api.services.bigquery.model.BigtableColumn, BigtableColumn> FROM_PB_FUNCTION =
new Function<com.google.api.services.bigquery.model.BigtableColumn, BigtableColumn>() {
@Override
public BigtableColumn apply(
com.google.api.services.bigquery.model.BigtableColumn pb) {
return BigtableColumn.fromPb(pb);
}
};

static final Function<BigtableColumn, com.google.api.services.bigquery.model.BigtableColumn> TO_PB_FUNCTION =
new Function<BigtableColumn, com.google.api.services.bigquery.model.BigtableColumn>() {
@Override
public com.google.api.services.bigquery.model.BigtableColumn apply(
BigtableColumn column) {
return column.toPb();
}
};

private static final long serialVersionUID = 1L;

public String getQualifierEncoded() { return qualifierEncoded; }
public String getFieldName() { return fieldName; }
public Boolean getOnlyReadLatest() { return onlyReadLatest; }
public String getEncoding() { return encoding; }
public String getType() { return type; }

private final String qualifierEncoded;
private final String fieldName;
private final Boolean onlyReadLatest;
private final String encoding;
private final String type;

static final class Builder {
private String qualifierEncoded;
private String fieldName;
private Boolean onlyReadLatest;
private String encoding;
private String type;

private Builder() {}

This comment was marked as spam.

This comment was marked as spam.

/**
* Qualifier of the column.
*
* Columns in the parent column family that has this exact qualifier are exposed
* as . field. If the qualifier is valid UTF-8 string, it can be specified in the
* qualifier_string field. Otherwise, a base-64 encoded value must be set to qualifier_encoded. The column field name is the same as the
* column qualifier. However, if the qualifier is not a valid BigQuery field
* identifier, a valid identifier must be provided as field_name.
*/
Builder setQualifierEncoded(String qualifierEncoded) {
this.qualifierEncoded = qualifierEncoded;

This comment was marked as spam.

This comment was marked as spam.

return this;
}

/**
* If the qualifier is not a valid BigQuery field identifier, a valid identifier must
* be provided as the column field name and is used as field name in queries.
*/
Builder setFieldName(String fieldName) {
this.fieldName = fieldName;
return this;
}

/**
* If this is set, only the latest version of value in this column are exposed.
*
* 'onlyReadLatest' can also be set at the column family level. However, the setting
* at the column level takes precedence if 'onlyReadLatest' is set at both levels.
*/
Builder setOnlyReadLatest(Boolean onlyReadLatest) {
this.onlyReadLatest = onlyReadLatest;
return this;
}

/**
* The encoding of the values when the type is not STRING.
* Acceptable encoding values are:
* TEXT - indicates values are alphanumeric text strings.
* BINARY - indicates values are encoded using HBase Bytes.toBytes family of functions.
*
* Encoding can also be set at the column family level. However, the setting at the
* column level takes precedence if 'encoding' is set at both levels.
*/
Builder setEncoding(String encoding) {
this.encoding = encoding;
return this;
}

/**
* The type to convert the value in cells of this column.
*
* The values are expected to be encoded using HBase Bytes.toBytes function when using
* the BINARY encoding value. Following BigQuery types are allowed (case-sensitive):
* BYTES STRING INTEGER FLOAT BOOLEAN Default type is BYTES.
*
* 'type' can also be set at the column family level. However, the setting at the column
* level takes precedence if 'type' is set at both levels.
*
*/
Builder setType(String type) {
this.type = type;
return this;
}

BigtableColumn build() {return new BigtableColumn(this);}
}

BigtableColumn(Builder builder) {
qualifierEncoded = builder.qualifierEncoded;
fieldName = builder.fieldName;
onlyReadLatest = builder.onlyReadLatest;
encoding = builder.encoding;
type = builder.type;
}

@Override
public String toString() {
return MoreObjects.toStringHelper(this)
.add("qualifierEncoded", qualifierEncoded)
.add("fieldName", fieldName)
.add("onlyReadLatest", onlyReadLatest)
.add("encoding", encoding)
.add("type", type)
.toString();
}

@Override
public final int hashCode() {
return Objects.hash(
qualifierEncoded,
fieldName,
onlyReadLatest,
encoding,
type);
}

@Override
public final boolean equals(Object obj) {
if (obj == this) {
return true;
}
if (obj == null || !obj.getClass().equals(BigtableColumn.class)) {
return false;
}
BigtableColumn other = (BigtableColumn) obj;
return qualifierEncoded == other.qualifierEncoded
&& fieldName == other.fieldName
&& onlyReadLatest == other.onlyReadLatest
&& encoding == other.encoding
&& type == other.type;
}

static Builder newBuilder() {
return new Builder();
}

static BigtableColumn fromPb(com.google.api.services.bigquery.model.BigtableColumn column) {
Builder builder = new BigtableColumn.Builder();
builder.setQualifierEncoded(column.getQualifierEncoded());
builder.setFieldName(column.getFieldName());
builder.setOnlyReadLatest(column.getOnlyReadLatest());
builder.setEncoding(column.getEncoding());
builder.setType(column.getType());
return builder.build();
}

com.google.api.services.bigquery.model.BigtableColumn toPb() {
com.google.api.services.bigquery.model.BigtableColumn column = new com.google.api.services.bigquery.model.BigtableColumn()
.setQualifierEncoded(qualifierEncoded)
.setFieldName(fieldName)
.setOnlyReadLatest(onlyReadLatest)
.setEncoding(encoding)
.setType(type);
return column;
}
}
Loading