| 36 | |
| 37 | |
| 38 | |
| 39 | == 5th (5/28) == |
| 40 | === rock === |
| 41 | Slave 安裝程式demo |
| 42 | === fafa === |
| 43 | Master 安裝程式demo |
| 44 | === waue === |
| 45 | * 討論 web 要用 [http://wiki.apache.org/tomcat/UsingPhp tomcat 5 + php 4 ] 或 tomcat 6 + jsp |
| 46 | * 討論 目錄架構 |
| 47 | |
| 48 | * [http://trac.nchc.org.tw/cloud/export/124/nutchez-0.2/package/nutchez-0.2-20100524.tar.gz 下載修改後 nutch 叢集版 的壓縮檔] |
| 49 | * 設定叢集驅動模式( /opt/nutchez/nutch/conf/ 的 hadoop-site.xml ) |
| 50 | {{{ |
| 51 | #!xml |
| 52 | <configuration> |
| 53 | <property> |
| 54 | <name>fs.default.name</name> |
| 55 | <value>hdfs://localhost:9000</value> |
| 56 | </property> |
| 57 | <property> |
| 58 | <name>mapred.job.tracker</name> |
| 59 | <value>localhost:9001</value> |
| 60 | </property> |
| 61 | <property> |
| 62 | <name>hadoop.tmp.dir</name> |
| 63 | <value>/var/nutchez/nutch-nutchuser</value> |
| 64 | </property> |
| 65 | </configuration> |
| 66 | }}} |
| 67 | * 設定 最後的搜尋結果 ( /opt/nutchez/tomcat/webapps/ROOT/WEB-INF/classes/ 的 nutch-site.xml ) |
| 68 | {{{ |
| 69 | #!xml |
| 70 | <configuration> |
| 71 | <property> |
| 72 | <name>searcher.dir</name> |
| 73 | <value>/home/nutchuser/nutchez/search</value> |
| 74 | </property> |
| 75 | </configuration> |
| 76 | }}} |
| 77 | * 使 nutch 主程式引入環境變數 (改 /opt/nutchez/nutch/bin/nutch ) |
| 78 | {{{ |
| 79 | #!sh |
| 80 | NUTCH_HOME=/opt/nutchez/nutch |
| 81 | NUTCH_CONF_DIR=/opt/nutchez/nutch/conf |
| 82 | NUTCH_LOG_DIR=/var/nutchez/logs |
| 83 | }}} |
| 84 | * 使用叢集版的 nutch 之前,要先執行 hadoop namenode -format 與 start-all.sh |