This project has retired. For details please refer to its Attic page.
IntIntTextVertexValueInputFormat xref
View Javadoc

1   /*
2    * Licensed to the Apache Software Foundation (ASF) under one
3    * or more contributor license agreements.  See the NOTICE file
4    * distributed with this work for additional information
5    * regarding copyright ownership.  The ASF licenses this file
6    * to you under the Apache License, Version 2.0 (the
7    * "License"); you may not use this file except in compliance
8    * with the License.  You may obtain a copy of the License at
9    *
10   *     http://www.apache.org/licenses/LICENSE-2.0
11   *
12   * Unless required by applicable law or agreed to in writing, software
13   * distributed under the License is distributed on an "AS IS" BASIS,
14   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15   * See the License for the specific language governing permissions and
16   * limitations under the License.
17   */
18  
19  package org.apache.giraph.io.formats;
20  
21  import org.apache.giraph.utils.IntPair;
22  import org.apache.hadoop.io.IntWritable;
23  import org.apache.hadoop.io.Text;
24  import org.apache.hadoop.io.Writable;
25  import org.apache.hadoop.mapreduce.InputSplit;
26  import org.apache.hadoop.mapreduce.TaskAttemptContext;
27  
28  import java.io.IOException;
29  import java.util.regex.Pattern;
30  
31  /**
32   * Simple text-based {@link org.apache.giraph.io.VertexValueInputFormat}
33   * for integer ids and values.
34   *
35   * Each line consists of: id, value
36   *
37   * @param <E> Edge value
38   */
39  public class IntIntTextVertexValueInputFormat<E extends Writable> extends
40      TextVertexValueInputFormat<IntWritable, IntWritable, E> {
41    /** Separator for id and value */
42    private static final Pattern SEPARATOR = Pattern.compile("[\t ]");
43  
44    @Override
45    public TextVertexValueReader createVertexValueReader(
46        InputSplit split, TaskAttemptContext context) throws IOException {
47      return new IntIntTextVertexValueReader();
48    }
49  
50    /**
51     * {@link org.apache.giraph.io.VertexValueReader} associated with
52     * {@link IntIntTextVertexValueInputFormat}.
53     */
54    public class IntIntTextVertexValueReader extends
55        TextVertexValueReaderFromEachLineProcessed<IntPair> {
56  
57      @Override
58      protected IntPair preprocessLine(Text line) throws IOException {
59        String[] tokens = SEPARATOR.split(line.toString());
60        return new IntPair(Integer.parseInt(tokens[0]),
61            Integer.parseInt(tokens[1]));
62      }
63  
64      @Override
65      protected IntWritable getId(IntPair data) throws IOException {
66        return new IntWritable(data.getFirst());
67      }
68  
69      @Override
70      protected IntWritable getValue(IntPair data) throws IOException {
71        return new IntWritable(data.getSecond());
72      }
73    }
74  }