hive JoinOperator

bupt04406

浏览: 353418 次
性别:
来自: 杭州

最近访客更多访客>>

rotkNirvana

zhangyi0618

xuhai0605

pengcong90

博主相关

博客

微博

相册

留言

关于我

文章分类

社区版块

存档分类

博客分类：

Hive

hive

（1）startGroup：清空各个表的RowContainer
（2）processOp：根据tag，把row add到表对应的RowContainer中。
（3）endGroup：RowContainer中的数据进行join并输出。

RowContainer添加数据时：先判断内存数组（currentWriteBlock）中的数据条数是否达到了blockSize（默认是25000）。如果达到了，则先把这一块数据写入临时文件，再把新数据放入内存数组；如果没有达到，则直接放入内存数组（currentWriteBlock）中。所以数据可能文件中和内存中都有，也可能只在内存中。

读取时：
（1）first
如果文件中有，则读取文件中的数据，返回第一条，如果没有就读取内存中的值，返回第一条。
（2）next
先读取当前已加载的block中的数据；读完后如果文件中还有数据，则从文件中读取下一个block；文件中的数据读完后，再读取内存（currentWriteBlock）中的数据。

/**
 * Excerpt of the join operator: extends {@code CommonJoinOperator<JoinDesc>}
 * and shows only the initialization hook.
 */
public class JoinOperator extends CommonJoinOperator<JoinDesc> implements
    Serializable {

    /**
     * Initializes this operator by delegating to the superclass.
     *
     * @param hconf configuration handed through to the superclass initializer
     * @throws HiveException declared by this hook; this method itself only delegates
     */
    protected void initializeOp(Configuration hconf) throws HiveException {
          super.initializeOp(hconf); // delegate to CommonJoinOperator's initialization
    }

}

JoinOperator：
startGroup
/**
 * Marks the beginning of a new join key and empties every per-table row
 * container held in {@code storage}.
 *
 * @throws HiveException if clearing a row container fails
 */
@Override
public void startGroup() throws HiveException {
    LOG.trace("Join: Starting new group");
    // Flag that a new key has started.
    newGroupStarted = true;
    // Discard the rows buffered so far, one container at a time.
    for (AbstractRowContainer<ArrayList<Object>> container : storage.values()) {
      container.clear();
    }
}
endGroup
/**
 * Finishes the current group: either hands the group to the skew-join
 * context or generates and forwards the join results.
 *
 * @throws HiveException if result generation fails, or wrapping an
 *           IOException raised by the skew-join context
 */
@Override
public void endGroup() throws HiveException {
    // A skew key is handled in a separate map reduce job, not joined here.
    final boolean skewKeyActive = handleSkewJoin && skewJoinKeyContext.currBigKeyTag >= 0;
    if (!skewKeyActive) {
      checkAndGenObject();
      return;
    }

    try {
      skewJoinKeyContext.endGroup();
    } catch (IOException ioe) {
      LOG.error(ioe.getMessage(), ioe);
      throw new HiveException(ioe);
    }
}

JoinOperator ：
/**
 * Buffers one input row in the row container of the table it came from.
 * When the row belongs to the last join operand and that operand already
 * holds {@code joinEmitInterval} rows, partial join results are emitted and
 * the operand's container is cleared before the row is added.
 *
 * @param row the incoming row; its join key is read through the
 *          {@code Utilities.ReduceField.KEY} struct field
 * @param tag index of the input the row came from; also used as the alias
 * @throws HiveException wrapping any exception raised while handling the row
 */
public void processOp(Object row, int tag) throws HiveException {
    try {

      // get alias: the tag tells which input table this row came from
      alias = (byte) tag;

      if ((lastAlias == null) || (!lastAlias.equals(alias))) {
        // Restart the warning threshold (the original note says the default is 1000).
        nextSz = joinEmitInterval;
      }

      // nr holds the values computed from the row for this alias.
      ArrayList<Object> nr = JoinUtil.computeValues(row, joinValues.get(alias),
          joinValuesObjectInspectors.get(alias), joinFilters.get(alias),
          joinFilterObjectInspectors.get(alias), noOuterJoin);

      if (handleSkewJoin) {
        skewJoinKeyContext.handleSkew(tag);
      }

      // number of rows for the key in the given table
      int sz = storage.get(alias).size();
      StructObjectInspector soi = (StructObjectInspector) inputObjInspectors[tag];
      StructField sf = soi.getStructFieldRef(Utilities.ReduceField.KEY
          .toString());
      Object keyObject = soi.getStructFieldData(row, sf);

      // Are we consuming too much memory
      if (alias == numAliases - 1 && !(handleSkewJoin && skewJoinKeyContext.currBigKeyTag >= 0)) {
        if (sz == joinEmitInterval) {
          // The input is sorted by alias, so if we are already in the last join
          // operand,
          // we can emit some results now.
          // Note this has to be done before adding the current row to the
          // storage,
          // to preserve the correctness for outer joins.
          checkAndGenObject(); // emit partial results first
          storage.get(alias).clear(); // then empty this table's row container
        }
      } else {
        if (sz == nextSz) {
          // Output a warning if we reached at least 1000 rows for a join
          // operand
          // We won't output a warning for the last join operand since the size
          // will never goes to joinEmitInterval.
          LOG.warn("table " + alias + " has " + sz + " rows for join key "
              + keyObject);
          nextSz = getNextSize(nextSz);
        }
      }

      // Add the value to the vector
      storage.get(alias).add(nr);
      // if join-key is null, process each row in different group.
      if (SerDeUtils.hasAnyNullObject(keyObject, sf.getFieldObjectInspector())) {
        endGroup();
        startGroup();
      }
    } catch (Exception e) {
      // Report through the operator's logger (as endGroup does) instead of
      // dumping the stack trace to stderr.
      LOG.error(e.getMessage(), e);
      throw new HiveException(e);
    }
}

package org.apache.hadoop.hive.ql.exec.persistence：
public class RowContainer<Row extends List<Object>> extends AbstractRowContainer<Row>{

add
每次写入磁盘的都是一个已经写满的block，所以文件中的row数目一定是blockSize的整数倍；不足一个block的数据不会写入文件，而是留在currentWriteBlock中。
/**
 * Appends a row to this container and increments {@code size}.
 *
 * With a table descriptor present, the row goes into the in-memory write
 * block; a block that already holds {@code blockSize} rows is spilled to the
 * temp file first. Without a table descriptor, a non-null row is only
 * remembered as the dummy row.
 *
 * @param t the row to add
 * @throws HiveException if spilling the current block fails
 */
@Override
public void add(Row t) throws HiveException {
    if (this.tblDesc == null) {
      // the tableDesc will be null in the case that all columns in that table
      // is not used. we use a dummy row to denote all rows in that table, and
      // the dummy row is added by caller.
      if (t != null) {
        this.dummyRow = t;
      }
    } else {
      final boolean writeBlockFull = addCursor >= blockSize;
      if (writeBlockFull) {
        // The in-memory array is full: spill it to the tmp file and start over.
        spillBlock(currentWriteBlock, addCursor);
        addCursor = 0;
        if (numFlushedBlocks == 1) {
          currentWriteBlock = (Row[]) new ArrayList[blockSize];
        }
      }
      // Store the row in the write block and advance the cursor.
      currentWriteBlock[addCursor++] = t;
    }
    // Count the row in every case.
    ++size;
}

}

spillBlock
/**
 * Serializes the first {@code length} rows of {@code block} and writes them
 * to the container's temp file, creating the temp directory, temp file and
 * record writer on the first call.
 *
 * @param block array holding the rows to write
 * @param length number of rows, counted from index 0, to write
 * @throws HiveException if the writer was already closed, or wrapping any
 *           exception raised while creating the file or writing rows; the
 *           container is cleared before the exception is rethrown
 */
private void spillBlock(Row[] block, int length) throws HiveException {
    try {
      if (tmpFile == null) { // no temp file yet: create it together with the writer

        String suffix = ".tmp";
        if (this.keyObject != null) {
          suffix = "." + this.keyObject.toString() + suffix;
        }

        while (true) { // create the temp directory, retrying until it succeeds
          parentFile = File.createTempFile("hive-rowcontainer", "");
          // createTempFile made a file; replace it with a directory of the same name.
          boolean success = parentFile.delete() && parentFile.mkdir();
          if (success) {
            break;
          }
          LOG.debug("retry creating tmp row-container directory...");
        }

        tmpFile = File.createTempFile("RowContainer", suffix, parentFile);
        LOG.info("RowContainer created temp file " + tmpFile.getAbsolutePath());
        // Delete the temp file if the JVM terminate normally through Hadoop job
        // kill command.
        // Caveat: it won't be deleted if JVM is killed by 'kill -9'.
        parentFile.deleteOnExit();
        tmpFile.deleteOnExit();

        // rFile = new RandomAccessFile(tmpFile, "rw");
        HiveOutputFormat<?, ?> hiveOutputFormat = tblDesc.getOutputFileFormatClass().newInstance();
        tempOutPath = new Path(tmpFile.toString());
        // NOTE(review): localJc is never read; the writer below uses
        // jobCloneUsingLocalFs, which this call presumably initializes - confirm.
        JobConf localJc = getLocalFSJobConfClone(jc);
        rw = HiveFileFormatUtils.getRecordWriter(this.jobCloneUsingLocalFs, hiveOutputFormat, serde
            .getSerializedClass(), false, tblDesc.getProperties(), tempOutPath);
      } else if (rw == null) {
        throw new HiveException("RowContainer has already been closed for writing.");
      }

      // Reset the reusable two-slot wrapper row: slot 0 = value row, slot 1 = key.
      row.clear();
      row.add(null);
      row.add(null);

      if (this.keyObject != null) {
        // With a key object, each value row is written wrapped together with the key.
        row.set(1, this.keyObject);
        for (int i = 0; i < length; ++i) {
          Row currentValRow = block[i];
          row.set(0, currentValRow);
          Writable outVal = serde.serialize(row, standardOI);
          rw.write(outVal);
        }
      } else {
        for (int i = 0; i < length; ++i) { // write each row of the array to the file
          Row currentValRow = block[i];
          Writable outVal = serde.serialize(currentValRow, standardOI);
          rw.write(outVal); // write it out
        }
      }

      if (block == this.currentWriteBlock) { // the write block itself was just spilled
        this.addCursor = 0; // so restart filling it from the beginning
      }

      this.numFlushedBlocks++;
    } catch (Exception e) {
      clear();
      LOG.error(e.toString(), e);
      throw new HiveException(e);
    }
}

使用：
* for ( v = rowContainer.first(); v != null; v = rowContainer.next()) {
*   // do anything with v
* }
*
first
/**
 * Starts an iteration over the container and returns its first row.
 *
 * @return the first row, the dummy row when there is no table descriptor,
 *         or {@code null} when the container is empty
 * @throws HiveException wrapping any exception raised while preparing the read
 */
public Row first() throws HiveException {
    if (size == 0) { // size is incremented by every add()
      return null;
    }

    try {
      firstCalled = true; // next() refuses to run until this is set
      // when we reach here, we must have some data already (because size >0).
      // We need to see if there are any data flushed into file system. If not,
      // we can
      // directly read from the current write block. Otherwise, we need to read
      // from the beginning of the underlying file.
      this.itrCursor = 0;
      closeWriter(); // close the RecordWriter
      closeReader(); // close the RecordReader

      if (tblDesc == null) {
        // No table descriptor: every row is represented by the dummy row.
        this.itrCursor++;
        return dummyRow;
      }

      this.currentReadBlock = this.firstReadBlockPointer;
      if (this.numFlushedBlocks == 0) { // nothing was spilled to the file
        this.readBlockSize = this.addCursor; // number of rows available to read
        this.currentReadBlock = this.currentWriteBlock; // read straight from the write block
      } else {
        JobConf localJc = getLocalFSJobConfClone(jc);
        if (inputSplits == null) {
          // First read of the spilled data: build the input format and the splits once.
          if (this.inputFormat == null) {
            inputFormat = (InputFormat<WritableComparable, Writable>) ReflectionUtils.newInstance(
                tblDesc.getInputFileFormatClass(), localJc);
          }

          // Use the temp directory as the input directory for the splits.
          HiveConf.setVar(localJc, HiveConf.ConfVars.HADOOPMAPREDINPUTDIR,
              org.apache.hadoop.util.StringUtils.escapeString(parentFile.getAbsolutePath()));
          inputSplits = inputFormat.getSplits(localJc, 1);
          acutalSplitNum = inputSplits.length;
        }
        // Open a reader on the first split and load the first block from it.
        currentSplitPointer = 0;
        rr = inputFormat.getRecordReader(inputSplits[currentSplitPointer], localJc, Reporter.NULL);
        currentSplitPointer++;

        nextBlock();
      }
      // we are guaranteed that we can get data here (since 'size' is not zero)
      Row ret = currentReadBlock[itrCursor++]; // return the first row
      removeKeys(ret);
      return ret;
    } catch (Exception e) {
      throw new HiveException(e);
    }

}

next
/**
 * Returns the next row of the iteration started by {@code first()}.
 *
 * @return the next row, or {@code null} when the container is empty or all
 *         rows have been returned
 * @throws HiveException if loading the next block fails
 * @throws RuntimeException if {@code first()} has not been called yet
 */
public Row next() throws HiveException {

    if (!firstCalled) { // first() has not been called yet
      throw new RuntimeException("Call first() then call next().");
    }

    if (size == 0) {
      return null;
    }

    if (tblDesc == null) {
      // No table descriptor: hand out the dummy row until itrCursor reaches size.
      if (this.itrCursor < size) {
        this.itrCursor++;
        return dummyRow;
      }
      return null;
    }

    Row ret;
    if (itrCursor < this.readBlockSize) { // the current read block still has unread rows
      ret = this.currentReadBlock[itrCursor++];
      removeKeys(ret);
      return ret;
    } else { // the current read block is exhausted
      nextBlock(); // load the next block
      if (this.readBlockSize == 0) { // nothing more could be loaded from the file
        if (currentWriteBlock != null && currentReadBlock != currentWriteBlock) { // the write block has not been read yet
          // Switch to the in-memory write block, remembering the read block
          // in firstReadBlockPointer.
          this.itrCursor = 0;
          this.readBlockSize = this.addCursor;
          this.firstReadBlockPointer = this.currentReadBlock;
          currentReadBlock = currentWriteBlock;
        } else { // the write block has already been read as well
          return null;
        }
      }
      // Retry now that a new block is in place.
      return next();
    }
}

nextBlock
/**
 * Refills {@code currentReadBlock} with rows read from the spilled data,
 * moving on to the next input split when the current reader yields nothing.
 *
 * @return {@code true} if at least one row was loaded; {@code false} if
 *         nothing was ever spilled or no rows remain
 * @throws HiveException wrapping any exception raised while reading; the
 *           container is cleared before the exception is rethrown
 */
private boolean nextBlock() throws HiveException {
    itrCursor = 0; // reset the read cursor
    this.readBlockSize = 0; // reset the number of readable rows
    if (this.numFlushedBlocks == 0) { // nothing was written to the file
      return false;
    }

    try {
      if (val == null) {
        val = serde.getSerializedClass().newInstance();
      }
      boolean nextSplit = true;
      int i = 0;

      if (rr != null) {
        Object key = rr.createKey();
        // Deserialize records into currentReadBlock until it is full or the
        // reader is exhausted.
        while (i < this.currentReadBlock.length && rr.next(key, val)) {
          nextSplit = false;
          this.currentReadBlock[i++] = (Row) ObjectInspectorUtils.copyToStandardObject(serde
              .deserialize(val), serde.getObjectInspector(), ObjectInspectorCopyOption.WRITABLE);
        }
      }

      if (nextSplit && this.currentSplitPointer < this.acutalSplitNum) {
        // The return value is not needed; the call is kept because the reader
        // below uses jobCloneUsingLocalFs.
        // NOTE(review): presumably this call initializes that field - confirm.
        getLocalFSJobConfClone(jc);
        // open record reader to read next split
        rr = inputFormat.getRecordReader(inputSplits[currentSplitPointer], jobCloneUsingLocalFs,
            Reporter.NULL);
        currentSplitPointer++;
        return nextBlock();
      }

      this.readBlockSize = i; // number of rows actually loaded
      return this.readBlockSize > 0;
    } catch (Exception e) {
      LOG.error(e.getMessage(), e);
      try {
        this.clear();
      } catch (HiveException e1) {
        // Log the cleanup failure itself; the original failure was logged above.
        LOG.error(e1.getMessage(), e1);
      }
      throw new HiveException(e);
    }
}

分享到：

hive 两个不同类型的columns进行比较 | hive 中间结果和结果数据压缩

2011-09-13 21:36
浏览 2491
评论(0)
分类:开源软件
查看更多

发表评论

您还没有登录,请您登录后再发表评论

最近访客更多访客>>

博主相关

文章分类

社区版块

存档分类

最新评论