diff --git a/parquet-tools/src/main/java/parquet/tools/Main.java b/parquet-tools/src/main/java/parquet/tools/Main.java index 4613c3cff3..bfc6f62d70 100644 --- a/parquet-tools/src/main/java/parquet/tools/Main.java +++ b/parquet-tools/src/main/java/parquet/tools/Main.java @@ -153,7 +153,7 @@ public static void die(String message, boolean usage, String name, Command comma if (name != null && command != null) { showUsage(name, command); } else { - showUsage(name, command); + showUsage(); } } diff --git a/parquet-tools/src/main/java/parquet/tools/command/Registry.java b/parquet-tools/src/main/java/parquet/tools/command/Registry.java index d05fcb7973..1ccaddfd24 100644 --- a/parquet-tools/src/main/java/parquet/tools/command/Registry.java +++ b/parquet-tools/src/main/java/parquet/tools/command/Registry.java @@ -31,6 +31,7 @@ public final class Registry { registry.put("schema", ShowSchemaCommand.class); registry.put("meta", ShowMetaCommand.class); registry.put("dump", DumpCommand.class); + registry.put("rowcount", RowCountCommand.class); } public static Map allCommands() { diff --git a/parquet-tools/src/main/java/parquet/tools/command/RowCountCommand.java b/parquet-tools/src/main/java/parquet/tools/command/RowCountCommand.java new file mode 100644 index 0000000000..50169e6d6c --- /dev/null +++ b/parquet-tools/src/main/java/parquet/tools/command/RowCountCommand.java @@ -0,0 +1,121 @@ +/** + * Copyright 2013 ARRIS, Inc. + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ +package parquet.tools.command; + +import org.apache.commons.cli.CommandLine; +import org.apache.commons.cli.Option; +import org.apache.commons.cli.OptionBuilder; +import org.apache.commons.cli.Options; +import org.apache.hadoop.conf.Configuration; +import org.apache.hadoop.fs.Path; +import org.apache.hadoop.fs.FileStatus; + +import parquet.hadoop.Footer; +import parquet.hadoop.ParquetFileReader; +import parquet.hadoop.metadata.BlockMetaData; +import parquet.hadoop.metadata.ParquetMetadata; +import parquet.schema.MessageType; +import parquet.tools.Main; +import parquet.tools.util.PrettyPrintWriter; +import parquet.tools.util.PrettyPrintWriter.WhiteSpaceHandler; + +import com.google.common.base.Joiner; +import java.util.List; +import java.util.ArrayList; + +public class RowCountCommand extends ArgsOnlyCommand { + public static final String[] USAGE = new String[] { + "", + "where is the parquet file containing the row counts to show" + }; + + public static final Options OPTIONS; + static { + OPTIONS = new Options(); + Option detail = OptionBuilder.withLongOpt("detailed") + .withDescription("Show the individual row counts.") + .create('d'); + OPTIONS.addOption(detail); + } + + public RowCountCommand() { + super(1, 1); + } + + @Override + public String[] getUsageDescription() { + return USAGE; + } + + @Override + public Options getOptions() { + return OPTIONS; + } + + @Override + public void execute(CommandLine options) throws Exception { + super.execute(options); + + String[] args = options.getArgs(); + String input = args[0]; + + Configuration conf = new Configuration(); + Path inputPath = new Path(input); + FileStatus inputFileStatus = inputPath.getFileSystem(conf).getFileStatus(inputPath); + List