@dain
Last active December 10, 2017 02:41
Simple program to scan an ORC file
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.orc;
import com.facebook.presto.orc.metadata.OrcMetadataReader;
import com.facebook.presto.spi.block.Block;
import com.facebook.presto.spi.type.Type;
import com.facebook.presto.testing.TestingConnectorSession;
import com.google.common.collect.ImmutableMap;
import io.airlift.units.DataSize;
import org.joda.time.DateTimeZone;
import java.io.File;
import java.io.IOException;
import java.util.Map;
import java.util.Map.Entry;
import static com.facebook.presto.spi.type.BigintType.BIGINT;
import static com.facebook.presto.spi.type.DoubleType.DOUBLE;
import static com.facebook.presto.spi.type.VarcharType.VARCHAR;
import static io.airlift.units.DataSize.Unit.MEGABYTE;
@SuppressWarnings("UseOfSystemOutOrSystemErr")
public final class ScanOrcFile
{
    public static void main(String... args)
            throws Exception
    {
        File file = new File(args[0]);
        FileOrcDataSource orcDataSource = new FileOrcDataSource(file, new DataSize(1, MEGABYTE), new DataSize(8, MEGABYTE), new DataSize(8, MEGABYTE));
        OrcReader orcReader = new OrcReader(orcDataSource, new OrcMetadataReader(), new DataSize(1, MEGABYTE), new DataSize(8, MEGABYTE));

        //
        // Set your column types here
        //
        Map<Integer, Type> columnTypes = ImmutableMap.<Integer, Type>builder()
                .put(0, BIGINT)
                .put(1, DOUBLE)
                .put(2, VARCHAR)
                .build();

        OrcRecordReader recordReader = orcReader.createRecordReader(columnTypes, OrcPredicate.TRUE, DateTimeZone.getDefault());

        long rows = 0;
        for (int batchSize = recordReader.nextBatch(); batchSize > 0; batchSize = recordReader.nextBatch()) {
            readBatch(columnTypes, recordReader);
            rows += batchSize;
        }

        System.out.println();
        System.out.println("rows: " + rows);
    }
    private static void readBatch(Map<Integer, Type> columnTypes, OrcRecordReader recordReader)
            throws IOException
    {
        // print the first value of each column in the current batch;
        // nextBatch() is called only in the main loop, so no batches are skipped
        for (Entry<Integer, Type> entry : columnTypes.entrySet()) {
            Block block = recordReader.readBlock(entry.getValue(), entry.getKey());
            System.out.print(entry.getValue().getObjectValue(TestingConnectorSession.SESSION, block, 0));
            System.out.print(",");
        }
        System.out.println();
    }
}
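
ScanOrcFile prints only the first value of each batch. To dump every row instead, a helper along these lines should work; it is a sketch that reuses only the calls already used above (printBatch is a hypothetical name, not part of the gist):

    // Sketch: print every value of every column in the current batch.
    private static void printBatch(Map<Integer, Type> columnTypes, OrcRecordReader recordReader)
            throws IOException
    {
        // read all requested columns for the current batch; the ImmutableMap
        // iteration order is stable, so types[] and blocks[] line up
        Type[] types = new Type[columnTypes.size()];
        Block[] blocks = new Block[columnTypes.size()];
        int column = 0;
        for (Entry<Integer, Type> entry : columnTypes.entrySet()) {
            types[column] = entry.getValue();
            blocks[column] = recordReader.readBlock(entry.getValue(), entry.getKey());
            column++;
        }

        // all blocks in a batch have the same position count
        for (int position = 0; position < blocks[0].getPositionCount(); position++) {
            for (int i = 0; i < blocks.length; i++) {
                System.out.print(types[i].getObjectValue(TestingConnectorSession.SESSION, blocks[i], position));
                System.out.print(",");
            }
            System.out.println();
        }
    }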
@galabing commented Jun 9, 2016

Hi Dain,

Thanks for the example code. It's been very helpful for me to start playing with ORC.

Could you explain further how to get lazy materialization to work? I adapted the above code into the simple example below. After reading the blocks, I found their class to be FixedWidthBlock rather than LazyFixedWidthBlock, which, if I understand correctly, means the blocks are not lazily loaded. Do you know how I can turn on lazy materialization?

Thanks.

import static com.facebook.presto.spi.type.BigintType.BIGINT;
import static com.facebook.presto.spi.type.DoubleType.DOUBLE;

import java.io.File;
import java.io.IOException;
import java.util.Map;
import java.util.Map.Entry;

import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.hive.ql.io.orc.OrcFile;
import org.apache.hadoop.hive.ql.io.orc.Writer;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory;
import org.apache.hadoop.hive.serde2.objectinspector.ObjectInspectorFactory.ObjectInspectorOptions;
import org.joda.time.DateTimeZone;

import com.facebook.presto.orc.FileOrcDataSource;
import com.facebook.presto.orc.OrcDataSource;
import com.facebook.presto.orc.OrcReader;
import com.facebook.presto.orc.OrcRecordReader;
import com.facebook.presto.orc.TupleDomainOrcPredicate;
import com.facebook.presto.orc.memory.AggregatedMemoryContext;
import com.facebook.presto.orc.metadata.OrcMetadataReader;
import com.facebook.presto.spi.block.Block;
import com.facebook.presto.spi.type.Type;
import com.google.common.collect.ImmutableMap;

import io.airlift.units.DataSize;
import io.airlift.units.DataSize.Unit;

public class TestOrc {

  private static final String ORC_FILE = "/tmp/test.orc";

  private static class TestStruct {
    public final long key;
    public final double value;

    public TestStruct(long key, double value) {
      this.key = key;
      this.value = value;
    }
  }

  private static void write() throws IOException {
    ObjectInspector inspector = ObjectInspectorFactory
        .getReflectionObjectInspector(
            TestStruct.class,
            ObjectInspectorOptions.JAVA);
    OrcFile.WriterOptions options = OrcFile.writerOptions(new Configuration())
        .inspector(inspector);
    Writer writer = OrcFile.createWriter(new Path(ORC_FILE), options);

    for (int i = 0; i < 10000; ++i) {
      writer.addRow(new TestStruct(i, i * 2));
    }
    writer.close();
  }

  private static void read() throws IOException {
    OrcDataSource source = new FileOrcDataSource(
        new File(ORC_FILE),
        new DataSize(1, Unit.MEGABYTE),
        new DataSize(8, Unit.MEGABYTE),
        new DataSize(8, Unit.MEGABYTE));
    OrcReader reader = new OrcReader(
        source,
        new OrcMetadataReader(),
        new DataSize(1, Unit.MEGABYTE),
        new DataSize(8, Unit.MEGABYTE));

    Map<Integer, Type> columns = ImmutableMap.<Integer, Type>builder()
        .put(0, BIGINT)
        .put(1, DOUBLE)
        .build();
    OrcRecordReader recordReader = reader.createRecordReader(
        columns, TupleDomainOrcPredicate.TRUE, DateTimeZone.UTC,
        new AggregatedMemoryContext());

    long rows = 0;
    for (int batchSize = recordReader.nextBatch(); batchSize > 0;
        batchSize = recordReader.nextBatch()) {
      rows += batchSize;
      for (Entry<Integer, Type> entry : columns.entrySet()) {
        Block block = recordReader.readBlock(entry.getValue(), entry.getKey());
        System.out.println(block.getClass());
      }
    }
    System.out.println(rows);
  }

  public static void main(String[] args) throws IOException {
    write();
    read();
  }
}
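
Regarding the lazy materialization question above: with this standalone reader, readBlock appears to materialize the column eagerly; in Presto itself the laziness comes from the Hive connector's page source, which wraps each column in a lazy block whose loader only invokes readBlock the first time the block is accessed. Below is a rough sketch of that wrapping pattern, assuming the LazyBlock/LazyBlockLoader SPI of this Presto version; the exact class names and signatures may differ, so treat it as an assumption rather than a confirmed answer.

// Sketch only: defer column materialization by wrapping the read in a LazyBlock.
// LazyBlock, LazyBlockLoader, and setBlock are assumed SPI names; verify them
// against the presto-spi version you are building against.
import java.io.IOException;
import java.io.UncheckedIOException;

import com.facebook.presto.orc.OrcRecordReader;
import com.facebook.presto.spi.block.LazyBlock;
import com.facebook.presto.spi.block.LazyBlockLoader;
import com.facebook.presto.spi.type.Type;

final class LazyColumnLoader
        implements LazyBlockLoader<LazyBlock>
{
    private final OrcRecordReader recordReader;
    private final int columnIndex;
    private final Type type;
    private boolean loaded;

    LazyColumnLoader(OrcRecordReader recordReader, int columnIndex, Type type)
    {
        this.recordReader = recordReader;
        this.columnIndex = columnIndex;
        this.type = type;
    }

    @Override
    public void load(LazyBlock lazyBlock)
    {
        if (loaded) {
            return;
        }
        try {
            // the actual column read happens only on first access
            lazyBlock.setBlock(recordReader.readBlock(type, columnIndex));
        }
        catch (IOException e) {
            throw new UncheckedIOException(e);
        }
        loaded = true;
    }
}

// Usage inside the batch loop, instead of calling readBlock eagerly:
// Block block = new LazyBlock(batchSize, new LazyColumnLoader(recordReader, columnIndex, type));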
