<?xml version="1.0" encoding="UTF-8"?>
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements.  See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License.  You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->
<!--
 Plugin descriptor for "parse-oo".

 Registers org.apache.nutch.parse.oo.OOParser on the
 org.apache.nutch.parse.Parser extension point, once per supported document
 format. Every <implementation> carries two parameters:
   contentType : the MIME type the implementation is declared for
   pathSuffix  : the file name extension associated with that MIME type
 NOTE(review): how the host matches on these two parameters is decided by the
 plugin framework, not by this file; confirm against the Nutch version in use.
-->
<plugin
   id="parse-oo"
   name="OpenOffice/OpenDocument Parse Plug-in"
   version="1.0.0"
   provider-name="nutch.org">

   <!-- Code shipped by this plugin; all of the jar's contents are exported. -->
   <runtime>
      <library name="parse-oo.jar">
         <export name="*"/>
      </library>
   </runtime>

   <!-- Other plugins this descriptor declares as dependencies. -->
   <requires>
      <import plugin="nutch-extensionpoints"/>
      <import plugin="lib-xml"/>
   </requires>

   <!--
    One <implementation> per format. OpenDocument.* ids use the
    application/vnd.oasis.opendocument.* types; StarOffice.* ids use the
    application/vnd.sun.xml.* types. All of them point at the same class.
   -->
   <extension id="org.apache.nutch.parse.oo"
              name="OOParse"
              point="org.apache.nutch.parse.Parser">

      <!-- Text / Writer -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.Text"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.text"/>
         <parameter name="pathSuffix"  value="odt"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.Writer"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.writer"/>
         <parameter name="pathSuffix"  value="sxw"/>
      </implementation>

      <!-- Text / Writer Template -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.TextTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.text-template"/>
         <parameter name="pathSuffix"  value="ott"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.WriterTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.writer.template"/>
         <parameter name="pathSuffix"  value="stw"/>
      </implementation>

      <!-- Text-Web (HTML document template) -->
      <!-- The extension registered for opendocument.text-web is "oth";
           this entry previously listed "odh", which no OpenDocument type uses. -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.TextWeb"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.text-web"/>
         <parameter name="pathSuffix"  value="oth"/>
      </implementation>

      <!-- Text-Master (master document) -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.TextMaster"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.text-master"/>
         <parameter name="pathSuffix"  value="odm"/>
      </implementation>

      <!-- Spreadsheet / Calc -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.Spreadsheet"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.spreadsheet"/>
         <parameter name="pathSuffix"  value="ods"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.Calc"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.calc"/>
         <parameter name="pathSuffix"  value="sxc"/>
      </implementation>

      <!-- Spreadsheet / Calc Template -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.SpreadsheetTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.spreadsheet-template"/>
         <parameter name="pathSuffix"  value="ots"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.CalcTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.calc.template"/>
         <parameter name="pathSuffix"  value="stc"/>
      </implementation>

      <!-- Presentation / Impress -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.Presentation"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.presentation"/>
         <parameter name="pathSuffix"  value="odp"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.Impress"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.impress"/>
         <parameter name="pathSuffix"  value="sxi"/>
      </implementation>

      <!-- Presentation / Impress Template -->
      <implementation id="org.apache.nutch.parse.oo.OpenDocument.PresentationTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.oasis.opendocument.presentation-template"/>
         <parameter name="pathSuffix"  value="otp"/>
      </implementation>

      <implementation id="org.apache.nutch.parse.oo.StarOffice.ImpressTemplate"
                      class="org.apache.nutch.parse.oo.OOParser">
         <parameter name="contentType" value="application/vnd.sun.xml.impress.template"/>
         <parameter name="pathSuffix"  value="sti"/>
      </implementation>

   </extension>

</plugin>