Changes between Version 5 and Version 6 of waue/2011/0727


Ignore:
Timestamp:
Jul 27, 2011, 5:00:35 PM (13 years ago)
Author:
waue
Comment:

--

Legend:

Unmodified
Added
Removed
Modified
  • waue/2011/0727

    v5 v6  
    46 46 {{{
    47 47 #!text
       48 <configuration>
    48 49 <property>
    49 50   <name>http.agent.name</name>
    50 51   <value>waue_test</value>
    51 52 </property>
       53 <property>
       54   <name>plugin.includes</name>
       55   <value>protocol-http|urlfilter-regex|parse-(html|tika)|index-(basic|anchor)|scoring-opic|urlnormalizer-(pass|regex|basic)</value>
       56 </property>
       57 <property>
       58   <name>http.robots.agents</name>
       59   <value>nutch</value>
       60 </property>
       61 <property>
       62   <name>http.agent.url</name>
       63   <value>waue_test</value>
       64 </property>
       65 <property>
       66   <name>http.agent.email</name>
       67   <value>waue_test</value>
       68 </property>
       69 <property>
       70   <name>http.agent.version</name>
       71   <value>waue_test</value>
       72 </property>
       73 </configuration>
    52 74 }}}
    53 75
     
    74  96
    75  97 {{{
    76     echo "http://lucene.apache.org/nutch/" >urls/url.txt
        98 mkdir urls ; echo "http://lucene.apache.org/nutch/" >urls/url.txt
    77  99 bin/nutch crawl urls -dir crawl2 -depth 2 -topN 50
    78 100 }}}