| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| package org.apache.rya.api.resolver.triple.impl; |
| |
| import static org.apache.rya.api.RdfCloudTripleStoreConstants.DELIM_BYTE; |
| import static org.apache.rya.api.RdfCloudTripleStoreConstants.DELIM_BYTES; |
| import static org.apache.rya.api.RdfCloudTripleStoreConstants.EMPTY_BYTES; |
| import static org.apache.rya.api.RdfCloudTripleStoreConstants.TYPE_DELIM_BYTE; |
| |
| import java.nio.charset.StandardCharsets; |
| import java.security.MessageDigest; |
| import java.security.NoSuchAlgorithmException; |
| import java.util.Arrays; |
| import java.util.HashMap; |
| import java.util.Map; |
| |
| import org.apache.commons.codec.binary.Hex; |
| import org.apache.rya.api.RdfCloudTripleStoreConstants.TABLE_LAYOUT; |
| import org.apache.rya.api.domain.RyaStatement; |
| import org.apache.rya.api.domain.RyaType; |
| import org.apache.rya.api.domain.RyaIRI; |
| import org.apache.rya.api.resolver.RyaContext; |
| import org.apache.rya.api.resolver.RyaTypeResolverException; |
| import org.apache.rya.api.resolver.triple.TripleRow; |
| import org.apache.rya.api.resolver.triple.TripleRowResolver; |
| import org.apache.rya.api.resolver.triple.TripleRowResolverException; |
| |
| import com.google.common.primitives.Bytes; |
| |
| /** |
| * Will store triple in spo, po, osp. Storing everything in the whole row. |
| * Date: 7/13/12 |
| * Time: 8:51 AM |
| */ |
| public class WholeRowHashedTripleResolver implements TripleRowResolver { |
| |
| @Override |
| public Map<TABLE_LAYOUT, TripleRow> serialize(final RyaStatement stmt) throws TripleRowResolverException { |
| try { |
| final RyaIRI subject = stmt.getSubject(); |
| final RyaIRI predicate = stmt.getPredicate(); |
| final RyaType object = stmt.getObject(); |
| final RyaIRI context = stmt.getContext(); |
| final Long timestamp = stmt.getTimestamp(); |
| final byte[] columnVisibility = stmt.getColumnVisibility(); |
| final String qualifer = stmt.getQualifer(); |
| final byte[] qualBytes = qualifer == null ? EMPTY_BYTES : qualifer.getBytes(StandardCharsets.UTF_8); |
| final byte[] value = stmt.getValue(); |
| assert subject != null && predicate != null && object != null; |
| final byte[] cf = (context == null) ? EMPTY_BYTES : context.getData().getBytes(StandardCharsets.UTF_8); |
| final Map<TABLE_LAYOUT, TripleRow> tripleRowMap = new HashMap<TABLE_LAYOUT, TripleRow>(); |
| final MessageDigest md = MessageDigest.getInstance("MD5"); |
| final byte[] subjBytes = subject.getData().getBytes(StandardCharsets.UTF_8); |
| final byte[] subjHashBytes = md.digest(subjBytes); |
| final byte[] predBytes = predicate.getData().getBytes(StandardCharsets.UTF_8); |
| final byte[] predHashBytes = md.digest(predBytes); |
| final byte[][] objBytes = RyaContext.getInstance().serializeType(object); |
| tripleRowMap.put(TABLE_LAYOUT.SPO, |
| new TripleRow(Bytes.concat(Hex.encodeHexString(subjHashBytes).getBytes(StandardCharsets.UTF_8), DELIM_BYTES, subjBytes, DELIM_BYTES, |
| predBytes, DELIM_BYTES, |
| objBytes[0], objBytes[1]), cf, qualBytes, |
| timestamp, columnVisibility, value)); |
| tripleRowMap.put(TABLE_LAYOUT.PO, |
| new TripleRow(Bytes.concat(Hex.encodeHexString(predHashBytes).getBytes(StandardCharsets.UTF_8), DELIM_BYTES, predBytes, DELIM_BYTES, |
| objBytes[0], DELIM_BYTES, |
| subjBytes, objBytes[1]), cf, qualBytes, |
| timestamp, columnVisibility, value)); |
| tripleRowMap.put(TABLE_LAYOUT.OSP, |
| new TripleRow(Bytes.concat(objBytes[0], DELIM_BYTES, |
| subjBytes, DELIM_BYTES, |
| predBytes, objBytes[1]), cf, qualBytes, |
| timestamp, columnVisibility, value)); |
| return tripleRowMap; |
| } catch (final RyaTypeResolverException e) { |
| throw new TripleRowResolverException(e); |
| } catch (final NoSuchAlgorithmException e) { |
| throw new TripleRowResolverException(e); |
| } |
| } |
| |
| @Override |
| public RyaStatement deserialize(final TABLE_LAYOUT table_layout, final TripleRow tripleRow) throws TripleRowResolverException { |
| try { |
| assert tripleRow != null && table_layout != null; |
| byte[] row = tripleRow.getRow(); |
| |
| // if it is a hashed row, ony keep the row after the hash |
| if ((table_layout == TABLE_LAYOUT.SPO) || (table_layout == TABLE_LAYOUT.PO)) { |
| final int hashStart = Bytes.indexOf(row, DELIM_BYTE); |
| row = Arrays.copyOfRange(row, hashStart + 1, row.length); |
| } |
| |
| final int firstIndex = Bytes.indexOf(row, DELIM_BYTE); |
| final byte[] first= Arrays.copyOf(row, firstIndex); |
| final int secondIndex = Bytes.lastIndexOf(row, DELIM_BYTE); |
| final int typeIndex = Bytes.indexOf(row, TYPE_DELIM_BYTE); |
| final byte[] second = Arrays.copyOfRange(row, firstIndex + 1, secondIndex); |
| final byte[] third = Arrays.copyOfRange(row, secondIndex + 1, typeIndex); |
| final byte[] type = Arrays.copyOfRange(row, typeIndex, row.length); |
| final byte[] columnFamily = tripleRow.getColumnFamily(); |
| final boolean contextExists = columnFamily != null && columnFamily.length > 0; |
| final RyaIRI context = (contextExists) ? (new RyaIRI(new String(columnFamily, StandardCharsets.UTF_8))) : null; |
| final byte[] columnQualifier = tripleRow.getColumnQualifier(); |
| final String qualifier = columnQualifier != null && columnQualifier.length > 0 ? new String(columnQualifier, StandardCharsets.UTF_8) : null; |
| final Long timestamp = tripleRow.getTimestamp(); |
| final byte[] columnVisibility = tripleRow.getColumnVisibility(); |
| final byte[] value = tripleRow.getValue(); |
| |
| switch (table_layout) { |
| case SPO: { |
| final byte[] obj = Bytes.concat(third, type); |
| return new RyaStatement( |
| new RyaIRI(new String(first, StandardCharsets.UTF_8)), |
| new RyaIRI(new String(second, StandardCharsets.UTF_8)), |
| RyaContext.getInstance().deserialize(obj), |
| context, qualifier, columnVisibility, value, timestamp); |
| } |
| case PO: { |
| final byte[] obj = Bytes.concat(second, type); |
| return new RyaStatement( |
| new RyaIRI(new String(third, StandardCharsets.UTF_8)), |
| new RyaIRI(new String(first, StandardCharsets.UTF_8)), |
| RyaContext.getInstance().deserialize(obj), |
| context, qualifier, columnVisibility, value, timestamp); |
| } |
| case OSP: { |
| final byte[] obj = Bytes.concat(first, type); |
| return new RyaStatement( |
| new RyaIRI(new String(second, StandardCharsets.UTF_8)), |
| new RyaIRI(new String(third, StandardCharsets.UTF_8)), |
| RyaContext.getInstance().deserialize(obj), |
| context, qualifier, columnVisibility, value, timestamp); |
| } |
| } |
| } catch (final RyaTypeResolverException e) { |
| throw new TripleRowResolverException(e); |
| } |
| throw new TripleRowResolverException("TripleRow[" + tripleRow + "] with Table layout[" + table_layout + "] is not deserializable"); |
| } |
| |
| } |