Changeset 67
- Timestamp: May 21, 2009, 2:49:49 PM (16 years ago)
- Location: nutchez-0.1
- Files:
  - 7 added
  - 1 deleted
  - 6 edited
Legend:
- Unmodified
- Added
- Removed
-
nutchez-0.1/bin/nutchez
r66 r67 8 8 9 9 . ./nutchez-func.sh 10 10 11 # root ? 11 12 #check_if_root 12 13 13 14 # show url lists 15 16 setup_nutchez 17 14 18 CHECK=0 15 19 while [ $CHECK -eq 0 ]; do -
nutchez-0.1/bin/nutchez-func.sh
r66 r67 5 5 # . 6 6 7 . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh 8 9 VERB=1 7 . /etc/nutch/hadoop-env.sh || . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh 10 8 11 9 : ${DIALOG=dialog} 12 10 13 #NEZ_DIR=/home/waue/.nutchez 14 #NEZ_DIR_URL 15 #NEZ_DIR_OTHER 11 VERB=0 16 12 17 13 … … 53 49 } 54 50 51 setup_nutchez() { 52 if ! [ -e ~/.nutchez ] ;then 53 cp -rf /etc/nutch/.nutchez ~/ 54 chown -R $LOGNAME:$LOGNAME ~/.nutchez 55 if [ -e /tmp/nutch ] ;then 56 rm -rf /tmp/nutch 57 fi 58 mkdir /tmp/nutch 59 ln -sf ~/.nutchez/search /tmp/nutch/ 55 60 61 fi 62 } 56 63 57 64 show_urls (){ … … 98 105 echo " \n 2. The robot name is : \n" >> $tempfile 99 106 cat /tmp/n.robot.tmp >> $tempfile 100 echo " \n 3. The crawled d ipth is : \n " >> $tempfile107 echo " \n 3. The crawled depth is : \n " >> $tempfile 101 108 cat /tmp/n.crawler.tmp >> $tempfile 102 109 echo " \n 4. The explorer port is : \n " >> $tempfile … … 113 120 } 114 121 122 # define paramaters 123 ROBOT=`cat /tmp/n.url.txt` 124 URLS=`cat /tmp/n.url.txt` 125 DEPTH=`cat /tmp/n.url.txt` 126 PORT=`cat /tmp/n.url.txt` 127 115 128 start_crawl () { 116 129 echo_vb "7. start_crawl" 130 setup_nutch 131 /opt/nutch/bin/nutch crawl ~/.nutch/urls -dir ~/.nutch/search -threads 2 -depth $DEPTH 117 132 } 118 133 119 134 start_tomcat () { 120 135 echo_vb "8. start_tomcat " 136 /opt/nutch/tomcat/bin/startup.sh 121 137 } 122 138 -
nutchez-0.1/build.xml
r66 r67 14 14 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 15 15 See the License for the specific language governing permissions and 16 limitations under th eLicense.16 limitations under this License. 17 17 --> 18 18 <project name="Nutch" default="job"> -
nutchez-0.1/debian/nutchez.install
r66 r67 1 1 conf/* etc/nutch 2 2 bin opt/nutch 3 bin/nutchez* usr/local/sbin 3 4 lib opt/nutch 4 5 webapps opt/nutch -
nutchez-0.1/debian/nutchez.postrm
r66 r67 17 17 rm -rf /tmp/hadoop* 18 18 rm -rf /tmp/hsperfdata* 19 rm /usr/local/sbin/nutchez* 19 20 fi 20 21 } -
nutchez-0.1/tomcat/webapps/ROOT/WEB-INF/classes/nutch-site.xml
r66 r67 6 6 <property> 7 7 <name>searcher.dir</name> 8 <value>/ opt/nutch/search</value>8 <value>/tmp/nutch/search</value> 9 9 </property> 10 10 </configuration>
Note: See TracChangeset for help on using the changeset viewer.