This project has been retired. For details, please refer to its Attic page.
GiraphTextInputFormat xref
View Javadoc

1   /*
2    * Licensed to the Apache Software Foundation (ASF) under one
3    * or more contributor license agreements.  See the NOTICE file
4    * distributed with this work for additional information
5    * regarding copyright ownership.  The ASF licenses this file
6    * to you under the Apache License, Version 2.0 (the
7    * "License"); you may not use this file except in compliance
8    * with the License.  You may obtain a copy of the License at
9    *
10   *     http://www.apache.org/licenses/LICENSE-2.0
11   *
12   * Unless required by applicable law or agreed to in writing, software
13   * distributed under the License is distributed on an "AS IS" BASIS,
14   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15   * See the License for the specific language governing permissions and
16   * limitations under the License.
17   */
18  
19  package org.apache.giraph.io.formats;
20  
21  import org.apache.hadoop.fs.Path;
22  import org.apache.hadoop.io.LongWritable;
23  import org.apache.hadoop.io.Text;
24  import org.apache.hadoop.io.compress.CompressionCodec;
25  import org.apache.hadoop.io.compress.CompressionCodecFactory;
26  import org.apache.hadoop.mapreduce.InputSplit;
27  import org.apache.hadoop.mapreduce.JobContext;
28  import org.apache.hadoop.mapreduce.RecordReader;
29  import org.apache.hadoop.mapreduce.TaskAttemptContext;
30  import org.apache.hadoop.mapreduce.lib.input.LineRecordReader;
31  
32  /**
33   * Provides functionality similar to
34   * {@link org.apache.hadoop.mapreduce.lib.input.TextInputFormat},
35   * but allows for different data sources (vertex and edge data).
36   */
37  public class GiraphTextInputFormat
38      extends GiraphFileInputFormat<LongWritable, Text> {
39    @Override
40    public RecordReader<LongWritable, Text>
41    createRecordReader(InputSplit split, TaskAttemptContext context) {
42      return new LineRecordReader();
43    }
44  
45    @Override
46    protected boolean isSplitable(JobContext context, Path file) {
47      CompressionCodec codec =
48          new CompressionCodecFactory(context.getConfiguration()).getCodec(file);
49      return codec == null;
50    }
51  }