source: sample/HBaseRecord2.java @ 10

/**
 * Program: HBaseRecord2.java
 * Editor: Waue Chen
 * From: NCHC, Taiwan
 * Last Update Date: 06/13/2008
 */

/**
 * Purpose:
 *  1. Auto-generate an HTable.
 *  2. Parse your records and store them in HBase.
 *
 * HowToUse:
 *  Make sure the Hadoop file system and HBase are running correctly.
 *  1. Put test.txt in the t1 directory; its content is
 *  ---------------
 *  name:locate:years
 *  waue:taiwan:1981
 *  shellon:taiwan:1981
 *  ---------------
 *  2. hadoop_root/$ bin/hadoop dfs -put t1 t1
 *  3. hbase_root/$ bin/hbase shell
 *  4. hql > create table t1_table("person");
 *  5. Go back to Eclipse and run this code; the resulting table is
 *  t1_table -> person
 *    ----------------------------
 *    | name    | locate | years |
 *    | waue    | taiwan | 1981  |
 *    | shellon | taiwan | 1981  |
 *    ----------------------------
 * Check Result:
 *  Go to the hbase console and type:
 *    hql > select * from t1_table;
 *
 *  08/06/06 12:20:48 INFO hbase.HTable: Creating scanner over t1_table starting at key
 *  +-------------------------+-------------------------+-------------------------+
 *  | Row                     | Column                  | Cell                    |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 0                       | person:locate           | locate                  |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 0                       | person:name             | name                    |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 0                       | person:years            | years                   |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 19                      | person:locate           | taiwan                  |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 19                      | person:name             | waue                    |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 19                      | person:years            | 1981                    |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 36                      | person:locate           | taiwan                  |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 36                      | person:name             | shellon                 |
 *  +-------------------------+-------------------------+-------------------------+
 *  | 36                      | person:years            | 1981                    |
 *  +-------------------------+-------------------------+-------------------------+
 *  3 row(s) in set. (0.04 sec)
 */
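
/*
 * A possible alternative to step 5 above (a sketch; the jar name below is
 * hypothetical, not from the original notes): pack the compiled class into
 * a jar and submit the job from the command line instead of Eclipse:
 *
 *   hadoop_root/$ bin/hadoop jar nchc-samples.jar tw.org.nchc.code.HBaseRecord2
 */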

package tw.org.nchc.code;
63
64import java.io.IOException;
65import java.util.Iterator;
66
67import org.apache.hadoop.fs.Path;
68import org.apache.hadoop.hbase.io.ImmutableBytesWritable;
69import org.apache.hadoop.hbase.mapred.TableReduce;
70import org.apache.hadoop.io.LongWritable;
71import org.apache.hadoop.io.MapWritable;
72import org.apache.hadoop.io.Text;
73import org.apache.hadoop.mapred.JobClient;
74import org.apache.hadoop.mapred.JobConf;
75import org.apache.hadoop.mapred.OutputCollector;
76import org.apache.hadoop.mapred.Reporter;
77import org.apache.hadoop.mapred.lib.IdentityMapper;
78import org.apache.hadoop.mapred.lib.IdentityReducer;
79

public class HBaseRecord2 {

  /* Define parameters */
  // one column family: person; three column qualifiers: name, locate, years
  final String colstr;
  // HBase table name
  String Table_Name = "Record1";
  // split character
  static String sp = ":";
  // file path in the Hadoop file system (not the physical file system)
  String file_path = "/user/waue/t1";

  public HBaseRecord2() {
    colstr = "person:name,locate,years";
  }

  public HBaseRecord2(String str) {
    colstr = str;
  }
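
  /*
   * Usage sketch (the schema below is hypothetical): new
   * HBaseRecord2("animal:kind,legs,home") would target column family
   * "animal" with qualifiers kind, legs, home. Note that in this sample
   * ReduceClass writes the fixed default columns, so the no-argument
   * constructor is the one exercised by main().
   */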

  private static class ReduceClass extends TableReduce<LongWritable, Text> {

    // column names: family "person" with qualifiers name, locate, years;
    // these match the default colstr "person:name,locate,years"
    private static final Text col_name = new Text("person:name");
    private static final Text col_local = new Text("person:locate");
    private static final Text col_year = new Text("person:years");

    // this map holds the columns of the current row
    private MapWritable map = new MapWritable();

    // in this sample the map phase is a pass-through (IdentityMapper);
    // all of the work happens here in reduce
    public void reduce(LongWritable key, Iterator<Text> values,
        OutputCollector<Text, MapWritable> output, Reporter reporter)
        throws IOException {

      // Text.toString() decodes the record; using getBytes() directly would
      // also require getLength(), since the backing array can be oversized
      String stro = values.next().toString();
      // each record looks like "waue:taiwan:1981" -> name, locate, years
      String str[] = stro.split(sp);
      byte b_name[] = str[0].getBytes();
      byte b_local[] = str[1].getBytes();
      byte b_year[] = str[2].getBytes();

      // cell contents must be ImmutableBytesWritable
      ImmutableBytesWritable w_name = new ImmutableBytesWritable(b_name);
      ImmutableBytesWritable w_local = new ImmutableBytesWritable(b_local);
      ImmutableBytesWritable w_year = new ImmutableBytesWritable(b_year);

      // populate the current row
      map.clear();
      map.put(col_name, w_name);
      map.put(col_local, w_local);
      map.put(col_year, w_year);

      // emit the row, using the key (the line's byte offset) as the row id
      output.collect(new Text(key.toString()), map);
    }
  }
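
  /*
   * Worked example of one reduce call, using the sample input above:
   * key = 19 (the byte offset of the line "waue:taiwan:1981", per the
   * scan output in the header comment), value = "waue:taiwan:1981".
   * split(":") yields {"waue", "taiwan", "1981"}, so the call emits
   *
   *   row "19" -> { person:name   = "waue",
   *                 person:locate = "taiwan",
   *                 person:years  = "1981" }
   *
   * which matches the select * output shown in the header comment.
   */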

  /**
   * Runs the demo.
   */
  public static void main(String[] args) throws IOException {
    // parse colstr to split the column family from the column qualifiers
    HBaseRecord2 work = new HBaseRecord2();

    String tmp[] = work.colstr.split(":");
    String Column_Family = tmp[0] + ":";
    String CF[] = { Column_Family };
    // the qualifiers ("name,locate,years") follow the colon
    String CQ[] = tmp[1].split(",");
    // create the table only if it does not already exist; we do not allow
    // two tables with the same name but different structures

    BuildHTable build_table = new BuildHTable(work.Table_Name, CF);
    if (!build_table.checkTableExist(work.Table_Name)) {
      if (!build_table.createTable()) {
        System.out.println("create table error !");
      }
    } else {
      System.out.println("Table \"" + work.Table_Name
          + "\" already exists !");
    }

    JobConf conf = new JobConf(HBaseRecord2.class);
    int mapTasks = 1;
    int reduceTasks = 1;
    // job name; modify it to anything you like
    conf.setJobName("NCHC_PersonDataBase");

    // the HBase table name must be correct; this program writes to Record1
    TableReduce.initJob(work.Table_Name, ReduceClass.class, conf);

    // below is the map-reduce profile
    conf.setNumMapTasks(mapTasks);
    conf.setNumReduceTasks(reduceTasks);
    conf.setInputPath(new Path(work.file_path));
    conf.setMapperClass(IdentityMapper.class);
    conf.setCombinerClass(IdentityReducer.class);
    conf.setReducerClass(ReduceClass.class);
    JobClient.runJob(conf);
  }
}
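
/*
 * BuildHTable lives elsewhere in this repository and is not part of this
 * file. The sketch below (the class name BuildHTableSketch is mine, and the
 * HBase 0.1-era admin calls are an assumption) only illustrates the two
 * methods main() relies on; the real class may differ.
 */
class BuildHTableSketch {

  private final String tableName;
  private final String[] families;

  BuildHTableSketch(String tableName, String[] families) {
    this.tableName = tableName;
    this.families = families;
  }

  // true if a table with this name is already registered with the master
  boolean checkTableExist(String name) throws IOException {
    org.apache.hadoop.hbase.HBaseAdmin admin = new org.apache.hadoop.hbase.HBaseAdmin(
        new org.apache.hadoop.hbase.HBaseConfiguration());
    return admin.tableExists(new Text(name));
  }

  // creates the table with one column descriptor per family, e.g. "person:"
  boolean createTable() throws IOException {
    org.apache.hadoop.hbase.HBaseAdmin admin = new org.apache.hadoop.hbase.HBaseAdmin(
        new org.apache.hadoop.hbase.HBaseConfiguration());
    org.apache.hadoop.hbase.HTableDescriptor desc = new org.apache.hadoop.hbase.HTableDescriptor(
        tableName);
    for (String family : families) {
      desc.addFamily(new org.apache.hadoop.hbase.HColumnDescriptor(family));
    }
    admin.createTable(desc);
    return true;
  }
}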