Ignore:
Timestamp:
May 21, 2009, 2:49:49 PM (15 years ago)
Author:
waue
Message:

v2

File:
1 edited

Legend:

Unmodified
Added
Removed
  • nutchez-0.1/bin/nutchez-func.sh

    r66 r67  
    55# .
    66
    7 . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh
    8 
    9 VERB=1
     7. /etc/nutch/hadoop-env.sh || . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh
    108
    119: ${DIALOG=dialog}
    1210
    13 #NEZ_DIR=/home/waue/.nutchez
    14 #NEZ_DIR_URL
    15 #NEZ_DIR_OTHER
     11VERB=0
    1612
    1713
     
    5349}
    5450
     51setup_nutchez() {
     52  if ! [ -e ~/.nutchez ] ;then
     53    cp -rf /etc/nutch/.nutchez ~/
     54    chown -R $LOGNAME:$LOGNAME ~/.nutchez
     55    if [ -e /tmp/nutch ] ;then
     56      rm -rf /tmp/nutch
     57    fi
     58    mkdir /tmp/nutch
     59    ln -sf ~/.nutchez/search /tmp/nutch/
    5560
     61  fi
     62}
    5663
    5764show_urls (){
     
    98105  echo " \n 2. The robot name is : \n" >> $tempfile
    99106  cat /tmp/n.robot.tmp >> $tempfile
    100   echo " \n 3. The crawled dipth is : \n " >> $tempfile
     107  echo " \n 3. The crawled depth is : \n " >> $tempfile
    101108  cat /tmp/n.crawler.tmp >> $tempfile
    102109  echo " \n 4. The explorer port is : \n " >> $tempfile
     
    113120}
    114121
     122# define parameters
     123ROBOT=`cat /tmp/n.url.txt`
     124URLS=`cat /tmp/n.url.txt`
     125DEPTH=`cat /tmp/n.url.txt`
     126PORT=`cat /tmp/n.url.txt`
     127
    115128start_crawl () {
    116129  echo_vb "7. start_crawl"
     130  setup_nutch
     131  /opt/nutch/bin/nutch crawl ~/.nutch/urls -dir ~/.nutch/search -threads 2 -depth $DEPTH
    117132}
    118133
    119134start_tomcat () {
    120135  echo_vb "8. start_tomcat "
     136  /opt/nutch/tomcat/bin/startup.sh
    121137}
    122138
Note: See TracChangeset for help on using the changeset viewer.