| | 36 | |
| | 37 | |
| | 38 | |
| | 39 | == 5th (5/28) == |
| | 40 | === rock === |
| | 41 | Slave 安裝程式demo |
| | 42 | === fafa === |
| | 43 | Master 安裝程式demo |
| | 44 | === waue === |
| | 45 | * 討論 web 要用 [http://wiki.apache.org/tomcat/UsingPhp tomcat 5 + php 4 ] 或 tomcat 6 + jsp |
| | 46 | * 討論 目錄架構 |
| | 47 | |
| | 48 | * [http://trac.nchc.org.tw/cloud/export/124/nutchez-0.2/package/nutchez-0.2-20100524.tar.gz 下載修改後 nutch 叢集版 的壓縮檔] |
| | 49 | * 設定叢集驅動模式( /opt/nutchez/nutch/conf/ 的 hadoop-site.xml ) |
| | 50 | {{{ |
| | 51 | #!xml |
| | 52 | <configuration> |
| | 53 | <property> |
| | 54 | <name>fs.default.name</name> |
| | 55 | <value>hdfs://localhost:9000</value> |
| | 56 | </property> |
| | 57 | <property> |
| | 58 | <name>mapred.job.tracker</name> |
| | 59 | <value>localhost:9001</value> |
| | 60 | </property> |
| | 61 | <property> |
| | 62 | <name>hadoop.tmp.dir</name> |
| | 63 | <value>/var/nutchez/nutch-nutchuser</value> |
| | 64 | </property> |
| | 65 | </configuration> |
| | 66 | }}} |
| | 67 | * 設定 最後的搜尋結果 ( /opt/nutchez/tomcat/webapps/ROOT/WEB-INF/classes/ 的 nutch-site.xml ) |
| | 68 | {{{ |
| | 69 | #!xml |
| | 70 | <configuration> |
| | 71 | <property> |
| | 72 | <name>searcher.dir</name> |
| | 73 | <value>/home/nutchuser/nutchez/search</value> |
| | 74 | </property> |
| | 75 | </configuration> |
| | 76 | }}} |
| | 77 | * 使 nutch 主程式引入環境變數 (改 /opt/nutchez/nutch/bin/nutch ) |
| | 78 | {{{ |
| | 79 | #!sh |
| | 80 | NUTCH_HOME=/opt/nutchez/nutch |
| | 81 | NUTCH_CONF_DIR=/opt/nutchez/nutch/conf |
| | 82 | NUTCH_LOG_DIR=/var/nutchez/logs |
| | 83 | }}} |
| | 84 | * 叢集版的 nutch ,要使用之前,要先執行 hadoop namenode -format 與 start-all.sh |