Package com.hp.hpl.jena.tdb.store.bulkloader2

Source Code of com.hp.hpl.jena.tdb.store.bulkloader2.CmdIndexBuild

/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements.  See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership.  The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License.  You may obtain a copy of the License at
*
*     http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package com.hp.hpl.jena.tdb.store.bulkloader2;

import java.io.InputStream ;
import java.util.Arrays ;
import java.util.Iterator ;

import org.openjena.atlas.AtlasException ;
import org.openjena.atlas.io.IO ;
import org.openjena.atlas.lib.ColumnMap ;
import org.openjena.atlas.logging.Log ;
import tdb.cmdline.CmdTDB ;

import com.hp.hpl.jena.tdb.base.block.BlockMgr ;
import com.hp.hpl.jena.tdb.base.block.BlockMgrFactory ;
import com.hp.hpl.jena.tdb.base.file.FileSet ;
import com.hp.hpl.jena.tdb.base.file.Location ;
import com.hp.hpl.jena.tdb.base.record.Record ;
import com.hp.hpl.jena.tdb.base.record.RecordFactory ;
import com.hp.hpl.jena.tdb.index.bplustree.BPlusTree ;
import com.hp.hpl.jena.tdb.index.bplustree.BPlusTreeParams ;
import com.hp.hpl.jena.tdb.index.bplustree.BPlusTreeRewriter ;
import com.hp.hpl.jena.tdb.sys.Names ;
import com.hp.hpl.jena.tdb.sys.SystemTDB ;

/** From a file of records, build a (packed) index */
public class CmdIndexBuild
{
    static { Log.setLog4j() ; }
   
    public static void main(String...argv)
    {
        CmdTDB.setLogging() ;
        // DATA IN S/P/O columns but sorted by index order.
       
        if ( argv.length != 3 )
        {
            System.err.println("Usage: Location Index dataFile") ;
            System.exit(1) ;
        }
       
        String locationStr = argv[0] ;
        String indexName = argv[1] ;
        if ( ! Arrays.asList(Names.tripleIndexes).contains(indexName) &&
            ! Arrays.asList(Names.quadIndexes).contains(indexName) )
//       
//        if ( !indexName.equals("SPO") && !indexName.equals("POS") && !indexName.equals("OSP") )
        {
            System.err.println("Index name not recognized: "+indexName) ;
            System.exit(1) ;
        }
           
        String dataFile = argv[2] ;
       
        // Argument processing
       
        Location location = new Location(locationStr) ;
       
        //InputStream input = System.in ;
        InputStream input = IO.openFile(dataFile) ;
       
        int keyLength = SystemTDB.SizeOfNodeId * indexName.length() ;
        int valueLength = 0 ;
       
        // The name is the order.
        String primary = indexName ; 
       
        // Scope for optimization:
        // Null column map => no churn.
        // Do record -> record copy, not Tuple, Tuple copy.

        String primaryOrder ;
        int dftKeyLength ;
        int dftValueLength ;
        int tupleLength = indexName.length() ;

        if ( tupleLength == 3 )
        {
            primaryOrder = Names.primaryIndexTriples ;
            dftKeyLength = SystemTDB.LenIndexTripleRecord ;
            dftValueLength = 0 ;
        }
        else if ( tupleLength == 4 )
        {
            primaryOrder = Names.primaryIndexQuads ;
            dftKeyLength = SystemTDB.LenIndexQuadRecord ;
            dftValueLength = 0 ;
        }
        else
        {
            throw new AtlasException("Index name: "+indexName) ;
        }
       
        ColumnMap colMap = new ColumnMap(primaryOrder, indexName) ;


        // -1? Write only.
        // Also flush cache every so often => block writes (but not sequential so boring).
        int readCacheSize = 10 ;
        int writeCacheSize = 100 ;

        int blockSize = SystemTDB.BlockSize ;
        RecordFactory recordFactory = new RecordFactory(dftKeyLength, dftValueLength) ;
       
        int order = BPlusTreeParams.calcOrder(blockSize, recordFactory) ;
        BPlusTreeParams bptParams = new BPlusTreeParams(order, recordFactory) ;

        int blockSizeNodes = blockSize ;
        int blockSizeRecords = blockSize ;

        FileSet destination = new FileSet(location, indexName) ;

        BlockMgr blkMgrNodes = BlockMgrFactory.create(destination, Names.bptExtTree, blockSizeNodes, readCacheSize, writeCacheSize) ;
        BlockMgr blkMgrRecords = BlockMgrFactory.create(destination, Names.bptExtRecords, blockSizeRecords, readCacheSize, writeCacheSize) ;
       
        int rowBlock = 1000 ;
        Iterator<Record> iter = new RecordsFromInput(input, tupleLength, colMap, rowBlock) ;
        BPlusTree bpt2 = BPlusTreeRewriter.packIntoBPlusTree(iter, bptParams, recordFactory, blkMgrNodes, blkMgrRecords) ;
        bpt2.close() ;
    }
}
TOP

Related Classes of com.hp.hpl.jena.tdb.store.bulkloader2.CmdIndexBuild

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.