doc/html/DescriptorTable_8java_source.html

 // Copyright 2012 Cloudera Inc.

 //

 // Licensed under the Apache License, Version 2.0 (the "License");

 // you may not use this file except in compliance with the License.

 // You may obtain a copy of the License at

 //

 // http://www.apache.org/licenses/LICENSE-2.0

 //

 // Unless required by applicable law or agreed to in writing, software

 // distributed under the License is distributed on an "AS IS" BASIS,

 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 // See the License for the specific language governing permissions and

 // limitations under the License.


 package com.cloudera.impala.analysis;


 import java.util.Collection;

 import java.util.HashMap;

 import java.util.HashSet;

 import java.util.List;


 import com.cloudera.impala.catalog.Table;

 import com.cloudera.impala.catalog.View;

 import com.cloudera.impala.common.IdGenerator;

 import com.cloudera.impala.thrift.TDescriptorTable;

 import com.google.common.base.Preconditions;

 import com.google.common.collect.Lists;

 import com.google.common.collect.Maps;

 import com.google.common.collect.Sets;


 /**
  * Holds the tuple and slot descriptors created through this table, keyed by their
  * ids, together with the tables and partitions that have been registered as
  * referenced. Ids are handed out by per-table generators, and the whole structure can
  * be serialized into a {@link TDescriptorTable}.
  */
 public class DescriptorTable {
   private final HashMap<TupleId, TupleDescriptor> tupleDescs_ = Maps.newHashMap();
   private final HashMap<SlotId, SlotDescriptor> slotDescs_ = Maps.newHashMap();
   private final IdGenerator<TupleId> tupleIdGenerator_ = TupleId.createGenerator();
   private final IdGenerator<SlotId> slotIdGenerator_ = SlotId.createGenerator();
   // List of referenced tables with no associated TupleDescriptor to ship to the BE.
   // For example, the output table of an insert query.
   private final List<Table> referencedTables_ = Lists.newArrayList();
   // For each table, the set of partitions that are referenced by at least one scan range.
   private final HashMap<Table, HashSet<Long>> referencedPartitionsPerTable_ =
       Maps.newHashMap();

   /**
    * Creates a new, empty tuple descriptor with a freshly generated id and registers it
    * in this table.
    *
    * @param debugName name passed through to the TupleDescriptor constructor
    * @return the newly registered descriptor
    */
   public TupleDescriptor createTupleDescriptor(String debugName) {
     TupleDescriptor d = new TupleDescriptor(tupleIdGenerator_.getNextId(), debugName);
     tupleDescs_.put(d.getId(), d);
     return d;
   }

   /**
    * Creates a new tuple descriptor whose slots are copies of the slots of the
    * descriptor registered under srcId, computes its memory layout and registers it.
    *
    * @param srcId id of the tuple descriptor to copy; must be registered in this table
    * @param debugName name passed through to the TupleDescriptor constructor
    * @return the newly registered copy
    * @throws NullPointerException if no tuple descriptor is registered under srcId
    * @throws IllegalStateException if the copy's byte size differs from the source's
    */
   public TupleDescriptor copyTupleDescriptor(TupleId srcId, String debugName) {
     // Resolve and validate the source before allocating an id or registering anything,
     // so that a bad srcId does not leave an empty, orphaned tuple in the table.
     TupleDescriptor src = tupleDescs_.get(srcId);
     Preconditions.checkNotNull(src, "No tuple descriptor registered for id %s", srcId);

     TupleDescriptor d = new TupleDescriptor(tupleIdGenerator_.getNextId(), debugName);
     tupleDescs_.put(d.getId(), d);
     // create copies of slots
     for (SlotDescriptor slot: src.getSlots()) {
       copySlotDescriptor(d, slot);
     }
     d.computeMemLayout();
     Preconditions.checkState(d.getByteSize() == src.getByteSize());
     return d;
   }

   /**
    * Creates a new slot descriptor with a freshly generated id, adds it to tuple d and
    * registers it in this table.
    *
    * @param d the tuple descriptor that receives the new slot
    * @return the newly registered slot descriptor
    */
   public SlotDescriptor addSlotDescriptor(TupleDescriptor d) {
     SlotDescriptor result = new SlotDescriptor(slotIdGenerator_.getNextId(), d);
     d.addSlot(result);
     slotDescs_.put(result.getId(), result);
     return result;
   }

   /**
    * Creates a new slot descriptor from src (via the copying SlotDescriptor constructor)
    * with a freshly generated id, adds it to tuple dest and registers it in this table.
    *
    * @param dest the tuple descriptor that receives the new slot
    * @param src the slot descriptor to copy from
    * @return the newly registered slot descriptor
    */
   public SlotDescriptor copySlotDescriptor(TupleDescriptor dest, SlotDescriptor src) {
     SlotDescriptor result = new SlotDescriptor(slotIdGenerator_.getNextId(), dest, src);
     dest.addSlot(result);
     slotDescs_.put(result.getId(), result);
     return result;
   }

   /** Returns the tuple descriptor registered under id, or null if there is none. */
   public TupleDescriptor getTupleDesc(TupleId id) { return tupleDescs_.get(id); }

   /** Returns the slot descriptor registered under id, or null if there is none. */
   public SlotDescriptor getSlotDesc(SlotId id) { return slotDescs_.get(id); }

   /** Returns a live view of all registered tuple descriptors. */
   public Collection<TupleDescriptor> getTupleDescs() { return tupleDescs_.values(); }

   /** Returns a live view of all registered slot descriptors. */
   public Collection<SlotDescriptor> getSlotDescs() { return slotDescs_.values(); }

   /** Returns the tuple id generator's current maximum id. */
   public TupleId getMaxTupleId() { return tupleIdGenerator_.getMaxId(); }

   /** Returns the slot id generator's current maximum id. */
   public SlotId getMaxSlotId() { return slotIdGenerator_.getMaxId(); }

   /**
    * Registers a table that is referenced without an associated tuple descriptor.
    * toThrift() ships such tables with all of their partitions.
    */
   public void addReferencedTable(Table table) {
     referencedTables_.add(table);
   }

   /**
    * Returns the mutable set of referenced partition ids for table, creating and
    * registering an empty set on first access.
    */
   private HashSet<Long> getReferencedPartitions(Table table) {
     HashSet<Long> refPartitions = referencedPartitionsPerTable_.get(table);
     if (refPartitions == null) {
       refPartitions = new HashSet<Long>();
       referencedPartitionsPerTable_.put(table, refPartitions);
     }
     return refPartitions;
   }

   /** Records that partition partitionId of table is referenced. */
   public void addReferencedPartition(Table table, long partitionId) {
     getReferencedPartitions(table).add(partitionId);
   }

   /**
    * Marks every slot named in ids as materialized.
    *
    * @throws NullPointerException if an id has no registered slot descriptor
    */
   public void markSlotsMaterialized(List<SlotId> ids) {
     for (SlotId id: ids) {
       getRegisteredSlotDesc(id).setIsMaterialized(true);
     }
   }

   /**
    * Returns, in input order, the ids from slotIds whose slot descriptor belongs to the
    * tuple with id tupleId.
    *
    * @throws NullPointerException if an id has no registered slot descriptor
    */
   public List<SlotId> getTupleSlotIds(List<SlotId> slotIds, TupleId tupleId) {
     List<SlotId> result = Lists.newArrayList();
     for (SlotId id: slotIds) {
       if (getRegisteredSlotDesc(id).getParent().getId().equals(tupleId)) result.add(id);
     }
     return result;
   }

   /**
    * Looks up the slot descriptor for id and fails with a descriptive message, rather
    * than a bare NullPointerException at the call site, if it is not registered.
    */
   private SlotDescriptor getRegisteredSlotDesc(SlotId id) {
     SlotDescriptor desc = slotDescs_.get(id);
     Preconditions.checkNotNull(desc, "No slot descriptor registered for id %s", id);
     return desc;
   }

   // Computes physical layout parameters of all descriptors.
   // Call this only after the last descriptor was added.
   // Test-only.
   public void computeMemLayout() {
     for (TupleDescriptor d: tupleDescs_.values()) {
       d.computeMemLayout();
     }
   }

   /**
    * Serializes this table into a TDescriptorTable containing the materialized tuple
    * descriptors, their slots, and a descriptor for every referenced table.
    *
    * Tables added through addReferencedTable() are serialized with all partitions; all
    * other tables only with the partitions recorded via addReferencedPartition().
    * Note that looking up the partitions of a table that has none recorded registers an
    * empty set for it as a side effect of getReferencedPartitions().
    */
   public TDescriptorTable toThrift() {
     TDescriptorTable result = new TDescriptorTable();
     HashSet<Table> referencedTbls = Sets.newHashSet();
     HashSet<Table> allPartitionsTbls = Sets.newHashSet();
     for (TupleDescriptor tupleDesc: tupleDescs_.values()) {
       // inline view of a non-constant select has a non-materialized tuple descriptor
       // in the descriptor table just for type checking, which we need to skip
       if (tupleDesc.isMaterialized()) {
         result.addToTupleDescriptors(tupleDesc.toThrift());
         Table table = tupleDesc.getTable();
         if (table != null && !(table instanceof View)) referencedTbls.add(table);
         for (SlotDescriptor slotD: tupleDesc.getSlots()) {
           result.addToSlotDescriptors(slotD.toThrift());
         }
       }
     }
     for (Table table: referencedTables_) {
       referencedTbls.add(table);
       // We don't know which partitions are needed for INSERT, so include them all.
       allPartitionsTbls.add(table);
     }
     for (Table tbl: referencedTbls) {
       HashSet<Long> referencedPartitions = null; // null means include all partitions.
       if (!allPartitionsTbls.contains(tbl)) {
         referencedPartitions = getReferencedPartitions(tbl);
       }
       result.addToTableDescriptors(tbl.toThriftDescriptor(referencedPartitions));
     }
     return result;
   }

   /**
    * Returns a multi-line string: a "tuples:" header followed by the debug string of
    * each registered tuple descriptor, one per line.
    */
   public String debugString() {
     StringBuilder out = new StringBuilder();
     out.append("tuples:\n");
     for (TupleDescriptor desc: tupleDescs_.values()) {
       // Chain appends instead of building a temporary String per descriptor.
       out.append(desc.debugString()).append("\n");
     }
     return out.toString();
   }
 }

com.cloudera.impala.analysis.TupleDescriptor
Definition: TupleDescriptor.java:54

com.cloudera.impala.analysis.DescriptorTable.addReferencedPartition
void addReferencedPartition(Table table, long partitionId)
Definition: DescriptorTable.java:116

com.cloudera.impala.catalog.Table
Definition: Table.java:51

com.cloudera.impala.analysis.DescriptorTable.toThrift
TDescriptorTable toThrift()
Definition: DescriptorTable.java:149

com.cloudera.impala.analysis.DescriptorTable.referencedPartitionsPerTable_
final HashMap< Table, HashSet< Long > > referencedPartitionsPerTable_
Definition: DescriptorTable.java:45

com.cloudera.impala.analysis.SlotId
Definition: SlotId.java:20

com.cloudera.impala.catalog.View
Definition: View.java:41

com.cloudera.impala.analysis.DescriptorTable.getMaxTupleId
TupleId getMaxTupleId()
Definition: DescriptorTable.java:92

com.cloudera.impala.analysis.TupleDescriptor.getByteSize
int getByteSize()
Definition: TupleDescriptor.java:122

com.cloudera.impala.analysis.DescriptorTable.getSlotDesc
SlotDescriptor getSlotDesc(SlotId id)
Definition: DescriptorTable.java:89

com.cloudera.impala.analysis.DescriptorTable.getTupleSlotIds
List< SlotId > getTupleSlotIds(List< SlotId > slotIds, TupleId tupleId)
Definition: DescriptorTable.java:132

com.cloudera.impala.analysis.DescriptorTable.computeMemLayout
void computeMemLayout()
Definition: DescriptorTable.java:143

com.cloudera.impala.analysis.DescriptorTable.referencedTables_
final List< Table > referencedTables_
Definition: DescriptorTable.java:43

com.cloudera.impala.analysis.DescriptorTable.copyTupleDescriptor
TupleDescriptor copyTupleDescriptor(TupleId srcId, String debugName)
Definition: DescriptorTable.java:58

com.cloudera.impala.analysis.DescriptorTable.tupleIdGenerator_
final IdGenerator< TupleId > tupleIdGenerator_
Definition: DescriptorTable.java:39

com.cloudera.impala.analysis.DescriptorTable.createTupleDescriptor
TupleDescriptor createTupleDescriptor(String debugName)
Definition: DescriptorTable.java:48

com.cloudera.impala.analysis.DescriptorTable.getTupleDescs
Collection< TupleDescriptor > getTupleDescs()
Definition: DescriptorTable.java:90

com.cloudera.impala.analysis.DescriptorTable.getMaxSlotId
SlotId getMaxSlotId()
Definition: DescriptorTable.java:93

com.cloudera.impala.analysis.DescriptorTable.slotIdGenerator_
final IdGenerator< SlotId > slotIdGenerator_
Definition: DescriptorTable.java:40

com.cloudera.impala.analysis.SlotDescriptor
Definition: SlotDescriptor.java:29

com.cloudera.impala.analysis.DescriptorTable.getSlotDescs
Collection< SlotDescriptor > getSlotDescs()
Definition: DescriptorTable.java:91

com.cloudera.impala.analysis.TupleDescriptor.getSlots
ArrayList< SlotDescriptor > getSlots()
Definition: TupleDescriptor.java:96

com.cloudera.impala.analysis.DescriptorTable.getTupleDesc
TupleDescriptor getTupleDesc(TupleId id)
Definition: DescriptorTable.java:88

com.cloudera.impala.analysis.DescriptorTable.copySlotDescriptor
SlotDescriptor copySlotDescriptor(TupleDescriptor dest, SlotDescriptor src)
Definition: DescriptorTable.java:81

com.cloudera.impala.analysis.DescriptorTable.getReferencedPartitions
HashSet< Long > getReferencedPartitions(Table table)
Definition: DescriptorTable.java:103

com.cloudera.impala.analysis.DescriptorTable.tupleDescs_
final HashMap< TupleId, TupleDescriptor > tupleDescs_
Definition: DescriptorTable.java:37

com.cloudera.impala.analysis.DescriptorTable.slotDescs_
final HashMap< SlotId, SlotDescriptor > slotDescs_
Definition: DescriptorTable.java:38

com.cloudera.impala.analysis.DescriptorTable
Definition: DescriptorTable.java:36

com.cloudera.impala.analysis.DescriptorTable.addReferencedTable
void addReferencedTable(Table table)
Definition: DescriptorTable.java:95

com.cloudera.impala.analysis.TupleId
Definition: TupleId.java:23

com.cloudera.impala.analysis.DescriptorTable.debugString
String debugString()
Definition: DescriptorTable.java:180

com.cloudera.impala.analysis.DescriptorTable.addSlotDescriptor
SlotDescriptor addSlotDescriptor(TupleDescriptor d)
Definition: DescriptorTable.java:71

com.cloudera.impala.analysis.DescriptorTable.markSlotsMaterialized
void markSlotsMaterialized(List< SlotId > ids)
Definition: DescriptorTable.java:123