Changeset 18

Timestamp: Jul 2, 2008, 3:10:09 PM
Location:  sample
Files:     6 edited
Legend: unmodified lines are shown without a prefix, added lines are prefixed with "+", and removed lines are prefixed with "-".
sample/HBaseRecord.java
r9 → r18

  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/01/2008
+ * Last Update Date: 07/02/2008
+ * Upgrade to 0.17
  */
 …
  * Make sure Hadoop file system and Hbase are running correctly.
  * 1. put test.txt in t1 directory which content is
 		---------------
 		name:locate:years
 		waue:taiwan:1981
 		shellon:taiwan:1981
 		---------------
  * 2. hadoop_root/$ bin/hadoop dfs -put t1 t1
  * 3. hbase_root/$ bin/hbase shell
  * 4. hql > create table t1_table("person");
  * 5. Come to Eclipse and run this code, and we will let database as that
 		t1_table -> person
 		----------------
 		| name    | locate | years |
 		| waue    | taiwan | 1981  |
 		| shellon | taiwan | 1981  |
 		----------------
  * Check Result:
  * Go to hbase console, type :
  * hql > select * from t1_table;
 08/06/06 12:20:48 INFO hbase.HTable: Creating scanner over t1_table starting at key
 +-------------------------+-------------------------+-------------------------+
 | Row                     | Column                  | Cell                    |
 +-------------------------+-------------------------+-------------------------+
 | 0                       | person:locate           | locate                  |
 | 0                       | person:name             | name                    |
 | 0                       | person:years            | years                   |
 | 19                      | person:locate           | taiwan                  |
 | 19                      | person:name             | waue                    |
 | 19                      | person:years            | 1981                    |
 | 36                      | person:locate           | taiwan                  |
 | 36                      | person:name             | shellon                 |
 | 36                      | person:years            | 1981                    |
 +-------------------------+-------------------------+-------------------------+
 3 row(s) in set. (0.04 sec)
 */

 package tw.org.nchc.code;
 …
 import org.apache.hadoop.mapred.lib.IdentityReducer;

 public class HBaseRecord {

 	/* Denify parameter */
 	// one column family: person; three column qualifier: name,locate,years
-	static private String baseId1 ="person:name";
-	static private String baseId2 ="person:locate";
-	static private String baseId3 ="person:years";
-	//split character
+	static private String baseId1 = "person:name";
+	static private String baseId2 = "person:locate";
+	static private String baseId3 = "person:years";
+	// split character
 	static private String sp = ":";
 	// file path in hadoop file system (not phisical file system)
 	String file_path = "/user/waue/t1";
 	// Hbase table name
 	String table_name = "t1_table";
 	// setup MapTask and Reduce Task
 	int mapTasks = 1;
 	int reduceTasks = 1;

 	private static class ReduceClass extends TableReduce<LongWritable, Text> {

 		// Column id is created dymanically,
 		private static final Text col_name = new Text(baseId1);
 		private static final Text col_local = new Text(baseId2);
 		private static final Text col_year = new Text(baseId3);

 		// this map holds the columns per row
 		private MapWritable map = new MapWritable();
 		// on this sample, map is nonuse, we use reduce to handle
 		public void reduce(LongWritable key, Iterator<Text> values,
 …
 				throws IOException {

-			// values.next().getByte() can get value and transfer to byte form, there is an other way that let decode()
-			// to substitude getByte()
+			// values.next().getByte() can get value and transfer to byte form,
+			// there is an other way that let decode()
+			// to substitude getByte()
 			String stro = new String(values.next().getBytes());
 			String str[] = stro.split(sp);
 …
 			byte b_name[] = str[1].getBytes();
 			byte b_year[] = str[2].getBytes();

 			// contents must be ImmutableBytesWritable
-			ImmutableBytesWritable w_local = new ImmutableBytesWritable( b_local);
-			ImmutableBytesWritable w_name = new ImmutableBytesWritable( b_name);
-			ImmutableBytesWritable w_year = new ImmutableBytesWritable( b_year);
+			ImmutableBytesWritable w_local = new ImmutableBytesWritable(b_local);
+			ImmutableBytesWritable w_name = new ImmutableBytesWritable(b_name);
+			ImmutableBytesWritable w_year = new ImmutableBytesWritable(b_year);

 			// populate the current row
 …
 	 */
 	public static void main(String[] args) throws IOException {
 		// which path of input files in Hadoop file system

 		HBaseRecord setup = new HBaseRecord();
 		JobConf conf = new JobConf(HBaseRecord.class);

 		// Job name; you can modify to any you like
 		conf.setJobName("NCHC_PersonDataBase");

 		// Hbase table name must be correct , in our profile is t1_table
 		TableReduce.initJob(setup.table_name, ReduceClass.class, conf);

 		// below are map-reduce profile
 		conf.setNumMapTasks(setup.mapTasks);
 		conf.setNumReduceTasks(setup.reduceTasks);
-		conf.setInputPath(new Path(setup.file_path));
+		// 0.16
+		// conf.setInputPath(new Path(setup.file_path));
+		Convert.setInputPath(conf, new Path(setup.file_path));
 		conf.setMapperClass(IdentityMapper.class);
 		conf.setCombinerClass(IdentityReducer.class);
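Note: the Convert class called above (and in the files below) is a project-local helper in tw.org.nchc.code; its source is not part of this changeset. As a rough sketch only, assuming it does nothing more than delegate to the Hadoop 0.17 replacement for the deprecated JobConf.setInputPath(Path), it could look like this:

	package tw.org.nchc.code;

	import org.apache.hadoop.fs.Path;
	import org.apache.hadoop.mapred.FileInputFormat;
	import org.apache.hadoop.mapred.JobConf;

	// Hypothetical sketch of the Convert helper, not the committed source.
	public class Convert {
		// Replaces the 0.16-style conf.setInputPath(path); Hadoop 0.17 moved
		// this to the static FileInputFormat.setInputPaths(conf, paths...).
		static public void setInputPath(JobConf conf, Path path) {
			FileInputFormat.setInputPaths(conf, path);
		}
	}

Keeping the old call commented out next to the wrapper call, as the diff does, makes the 0.16 → 0.17 mapping easy to trace.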
sample/HBaseRecord2.java
r14 → r18

  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/01/2008
+ * Last Update Date: 07/01/2008
+ * Upgrade to 0.17
  */
 …
 package tw.org.nchc.code;

-import java.io.FileInputStream;
 import java.io.IOException;
 import java.util.Iterator;
 …
 					+ "\" has already existed !");
 		}
-		FileInputStream fi = new FileInputStream(setup.file_path);
-
 		JobConf conf = new JobConf(HBaseRecord2.class);
 …
 		conf.setNumMapTasks(setup.mapTasks);
 		conf.setNumReduceTasks(setup.reduceTasks);
-		conf.setInputPath(new Path(setup.file_path));
+		// 0.16
+		// conf.setInputPath(new Path(setup.file_path));
+		Convert.setInputPath(conf, new Path(setup.file_path));
 		conf.setMapperClass(IdentityMapper.class);
 		conf.setCombinerClass(IdentityReducer.class);
sample/HBaseRecordPro.java
r17 → r18

 /**
- * Program: HBaseRecord .java
+ * Program: HBaseRecordPro.java
  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/01/2008
+ * Last Update Date: 07/02/2008
+ * Upgrade to 0.17
  */
 …
 		conf.setNumMapTasks(mapTasks);
 		conf.setNumReduceTasks(reduceTasks);
-		conf.setInputPath(text_path);
+		// 0.16
+		// conf.setInputPath(text_path);
+		Convert.setInputPath(conf, text_path);
+
 		conf.setMapperClass(IdentityMapper.class);
 		conf.setCombinerClass(IdentityReducer.class);
 …
 		// delete tmp file
-		FileSystem.get(conf).delete(text_path);
+		// 0.16
+		// FileSystem.get(conf).delete(text_path);
+		FileSystem.get(conf).delete(text_path,true);
+
 		setup.deleteFile(conf_tmp);
 	}
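Note: the second change in this file swaps the deprecated FileSystem.delete(Path) for delete(Path, boolean). A minimal, self-contained illustration of the 0.17 call (the class name and path are made up for the example):

	import java.io.IOException;

	import org.apache.hadoop.fs.FileSystem;
	import org.apache.hadoop.fs.Path;
	import org.apache.hadoop.mapred.JobConf;

	// Illustrative only: remove a temporary file or directory with the 0.17 API.
	public class DeleteTmpExample {
		public static void main(String[] args) throws IOException {
			JobConf conf = new JobConf(DeleteTmpExample.class);
			Path tmp = new Path("/user/waue/tmp"); // hypothetical path
			// "true" requests recursive deletion, matching what the deprecated
			// delete(Path) did for directories.
			FileSystem.get(conf).delete(tmp, true);
		}
	}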
sample/WordCount.java
r9 → r18

  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/13/2008
+ * Last Update Date: 07/02/2008
+ * Upgrade to 0.17
  */
 …
 import org.apache.hadoop.mapred.Reporter;

 public class WordCount {
 	private String filepath;
 	private String outputPath;

-	public WordCount() {
+	public WordCount() {
 		filepath = "/user/waue/input/";
 		outputPath = "counts1";
 	}
-	public WordCount(String path,String output){
+
+	public WordCount(String path, String output) {
 		filepath = path;
 		outputPath = output;
 	}

 	// mapper: emits (token, 1) for every word occurrence
 	private static class MapClass extends MapReduceBase implements
 …
 		// reuse objects to save overhead of object creation
 		private final static IntWritable one = new IntWritable(1);
 		private Text word = new Text();
 …
 	/**
 	 * Runs the demo.
 …
 	public static void main(String[] args) throws IOException {
 		WordCount wc = new WordCount();

 		int mapTasks = 1;
 		int reduceTasks = 1;
 …
 		conf.setNumMapTasks(mapTasks);
 		conf.setNumReduceTasks(reduceTasks);
-		conf.setInputPath(new Path(wc.filepath));
+		// 0.16
+		// conf.setInputPath(new Path(wc.filepath));
+		Convert.setInputPath(conf, new Path(wc.filepath));
 		conf.setOutputKeyClass(Text.class);
 		conf.setOutputValueClass(IntWritable.class);
-		conf.setOutputPath(new Path(wc.outputPath));
+		// 0.16
+		// conf.setOutputPath(new Path(wc.outputPath));
+		Convert.setOutputPath(conf, new Path(wc.outputPath));

 		conf.setMapperClass(MapClass.class);
 		conf.setCombinerClass(ReduceClass.class);
 		conf.setReducerClass(ReduceClass.class);

 		// Delete the output directory if it exists already
 		Path outputDir = new Path(wc.outputPath);
-		FileSystem.get(conf).delete(outputDir);
+		// 0.16
+		FileSystem.get(conf).delete(outputDir,true);

 		JobClient.runJob(conf);
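Note: WordCount.java is the first file in this changeset that also routes its output path through the helper. The output-side counterpart of the setInputPath sketch above would presumably wrap FileOutputFormat.setOutputPath, which replaced the deprecated JobConf.setOutputPath(Path) in 0.17; again a sketch, not the committed source:

	package tw.org.nchc.code;

	import org.apache.hadoop.fs.Path;
	import org.apache.hadoop.mapred.FileOutputFormat;
	import org.apache.hadoop.mapred.JobConf;

	// Hypothetical sketch; in the real repository this method would sit in the
	// same Convert class as the setInputPath method shown earlier.
	public class Convert {
		// Replaces the 0.16-style conf.setOutputPath(path).
		static public void setOutputPath(JobConf conf, Path path) {
			FileOutputFormat.setOutputPath(conf, path);
		}
	}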
sample/WordCountFromHBase.java
r9 → r18

  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/13/2008
+ * Last Update Date: 07/02/2008
+ * Upgrade to 0.17
  */
 …
 import java.util.Iterator;
 import java.util.StringTokenizer;
-import java.io.FileOutputStream;
-import java.io.File;
-import java.io.RandomAccessFile;

 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 …
 		// input is Hbase format => TableInputFormat
 		conf.setInputFormat(TableInputFormat.class);
-		conf.setOutputPath(new Path(outputPath));
+		// 0.16
+		// conf.setOutputPath(new Path(outputPath));
+		Convert.setOutputPath(conf, new Path(outputPath));
 		// delete the old path with the same name
-		FileSystem.get(conf).delete(new Path(outputPath) );
+		FileSystem.get(conf).delete(new Path(outputPath),true);
 		JobClient.runJob(conf);
 	}
sample/WordCountIntoHBase.java
r8 → r18

  * Editor: Waue Chen
  * From : NCHC. Taiwn
- * Last Update Date: 06/10/2008
+ * Last Update Date: 07/02/2008
+ * Upgrade to 0.17
  */
 …
 	/* setup parameters */
-	// $Input_Path. Please make sure the path is correct and contains input files
+	// $Input_Path. Please make sure the path is correct and contains input
+	// files
 	static final String Input_Path = "/user/waue/simple";
 	// Hbase table name, the program will create it
 	static final String Table_Name = "word_count5";
 	// column name, the program will create it
-	static final String colstr = "word:text"
+	static final String colstr = "word:text";
 	// constructor
 	private WordCountIntoHBase() {
 …
 		// set (column_family:column_qualify)
 		private static final Text col = new Text(WordCountIntoHBase.colstr);
 		// this map holds the columns per row
 		private MapWritable map = new MapWritable();

 		public void reduce(LongWritable key, Iterator<Text> values,
 				OutputCollector<Text, MapWritable> output, Reporter reporter)
 				throws IOException {
 			// contents must be ImmutableBytesWritable
-			ImmutableBytesWritable bytes =
-				new ImmutableBytesWritable(values.next().getBytes());
+			ImmutableBytesWritable bytes = new ImmutableBytesWritable(values
+					.next().getBytes());
 			map.clear();
 			// write data
 			map.put(col, bytes);
 			// add the row with the key as the row id
 …
 	 * Runs the demo.
 	 */
 	public static void main(String[] args) throws IOException {
 		// parse colstr to split column family and column qualify
 		String tmp[] = colstr.split(":");
-		String Column_Family = tmp[0] +":";
-		String CF[] = { Column_Family};
+		String Column_Family = tmp[0] + ":";
+		String CF[] = { Column_Family };
 		// check whether create table or not , we don't admit \
 		// the same name but different structure
 		BuildHTable build_table = new BuildHTable(Table_Name, CF);
 		if (!build_table.checkTableExist(Table_Name)) {
 			if (!build_table.createTable()) {
 				System.out.println("create table error !");
 			}
-		}else{
-			System.out.println("Table \"" + Table_Name +"\" has already existed !");
+		} else {
+			System.out.println("Table \"" + Table_Name
+					+ "\" has already existed !");
 		}
 		int mapTasks = 1;
 …
 		conf.setNumMapTasks(mapTasks);
 		conf.setNumReduceTasks(reduceTasks);
-		conf.setInputPath(new Path(Input_Path));
+		// 0.16
+		// conf.setInputPath(new Path(Input_Path));
+		Convert.setInputPath(conf, new Path(Input_Path));
 		conf.setMapperClass(IdentityMapper.class);
 		conf.setCombinerClass(IdentityReducer.class);