Changeset 67


Ignore:
Timestamp:
May 21, 2009, 2:49:49 PM (15 years ago)
Author:
waue
Message:

v2

Location:
nutchez-0.1
Files:
7 added
1 deleted
6 edited

Legend:

Unmodified
Added
Removed
  • nutchez-0.1/bin/nutchez

    r66 r67  
    88
    99. ./nutchez-func.sh
     10
    1011# root ?
    1112#check_if_root
    1213
    1314# show url lists
     15
     16setup_nutchez
     17
    1418CHECK=0
    1519while [ $CHECK -eq 0 ]; do
  • nutchez-0.1/bin/nutchez-func.sh

    r66 r67  
    55# .
    66
    7 . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh
    8 
    9 VERB=1
     7. /etc/nutch/hadoop-env.sh || . $NUTCHEZ_SCRIPT_PATH/conf/hadoop-env.sh
    108
    119: ${DIALOG=dialog}
    1210
    13 #NEZ_DIR=/home/waue/.nutchez
    14 #NEZ_DIR_URL
    15 #NEZ_DIR_OTHER
     11VERB=0
    1612
    1713
     
    5349}
    5450
     51setup_nutchez() {
     52  if ! [ -e ~/.nutchez ] ;then
     53    cp -rf /etc/nutch/.nutchez ~/
     54    chown -R $LOGNAME:$LOGNAME ~/.nutchez
     55    if [ -e /tmp/nutch ] ;then
     56      rm -rf /tmp/nutch
     57    fi
     58    mkdir /tmp/nutch
     59    ln -sf ~/.nutchez/search /tmp/nutch/
    5560
     61  fi
     62}
    5663
    5764show_urls (){
     
    98105  echo " \n 2. The robot name is : \n" >> $tempfile
    99106  cat /tmp/n.robot.tmp >> $tempfile
    100   echo " \n 3. The crawled dipth is : \n " >> $tempfile
     107  echo " \n 3. The crawled depth is : \n " >> $tempfile
    101108  cat /tmp/n.crawler.tmp >> $tempfile
    102109  echo " \n 4. The explorer port is : \n " >> $tempfile
     
    113120}
    114121
     122# define paramaters
     123ROBOT=`cat /tmp/n.url.txt`
     124URLS=`cat /tmp/n.url.txt`
     125DEPTH=`cat /tmp/n.url.txt`
     126PORT=`cat /tmp/n.url.txt`
     127
    115128start_crawl () {
    116129  echo_vb "7. start_crawl"
     130  setup_nutch
     131  /opt/nutch/bin/nutch crawl ~/.nutch/urls -dir ~/.nutch/search -threads 2 -depth $DEPTH
    117132}
    118133
    119134start_tomcat () {
    120135  echo_vb "8. start_tomcat "
     136  /opt/nutch/tomcat/bin/startup.sh
    121137}
    122138
  • nutchez-0.1/build.xml

    r66 r67  
    1414 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    1515 See the License for the specific language governing permissions and
    16  limitations under the License.
     16 limitations under this License.
    1717-->
    1818<project name="Nutch" default="job">
  • nutchez-0.1/debian/nutchez.install

    r66 r67  
    11conf/*    etc/nutch
    22bin   opt/nutch
     3bin/nutchez*  usr/local/sbin
    34lib   opt/nutch
    45webapps   opt/nutch
  • nutchez-0.1/debian/nutchez.postrm

    r66 r67  
    1717    rm -rf /tmp/hadoop*
    1818    rm -rf /tmp/hsperfdata*
     19    rm /usr/local/sbin/nutchez*
    1920  fi
    2021}
  • nutchez-0.1/tomcat/webapps/ROOT/WEB-INF/classes/nutch-site.xml

    r66 r67  
    66    <property>
    77        <name>searcher.dir</name>
    8         <value>/opt/nutch/search</value>
     8        <value>/tmp/nutch/search</value>
    99    </property>
    1010</configuration>
Note: See TracChangeset for help on using the changeset viewer.