<?xml version="1.0" encoding="UTF-8"?>
<!--
 Licensed to the Apache Software Foundation (ASF) under one or more
 contributor license agreements. See the NOTICE file distributed with
 this work for additional information regarding copyright ownership.
 The ASF licenses this file to You under the Apache License, Version 2.0
 (the "License"); you may not use this file except in compliance with
 the License. You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
-->
<!--
 Object-to-table mapping. Each <class> element binds one persistent class
 (keyed by the type given in keyClass) to a table, and each <field> element
 binds one field of that class to a column of the table.
 NOTE(review): the "length" attribute presumably sets the column size;
 confirm against the data store that consumes this mapping.
-->
<gora-orm>

    <!-- WebPage records, keyed by String, stored in table "webpage". -->
    <class name="org.apache.nutch.storage.WebPage" keyClass="java.lang.String" table="webpage">
        <primarykey column="id" length="512"/>

        <!-- fetch fields -->
        <field name="baseUrl" column="baseUrl" length="512"/>
        <field name="status" column="status"/>
        <field name="prevFetchTime" column="prevFetchTime"/>
        <field name="fetchTime" column="fetchTime"/>
        <field name="fetchInterval" column="fetchInterval"/>
        <field name="retriesSinceFetch" column="retriesSinceFetch"/>
        <field name="reprUrl" column="reprUrl" length="512"/>
        <field name="content" column="content" length="65536"/>
        <!-- The only field whose column name ("typ") differs from its field name. -->
        <field name="contentType" column="typ" length="32"/>
        <field name="protocolStatus" column="protocolStatus"/>
        <field name="modifiedTime" column="modifiedTime"/>
        <field name="prevModifiedTime" column="prevModifiedTime"/>
        <field name="batchId" column="batchId" length="32"/>

        <!-- parse fields -->
        <field name="title" column="title" length="512"/>
        <field name="text" column="text" length="32000"/>
        <field name="parseStatus" column="parseStatus"/>
        <field name="signature" column="signature"/>
        <field name="prevSignature" column="prevSignature"/>

        <!-- score, header, link, metadata and marker fields -->
        <field name="score" column="score"/>
        <field name="headers" column="headers"/>
        <field name="inlinks" column="inlinks"/>
        <field name="outlinks" column="outlinks"/>
        <field name="metadata" column="metadata"/>
        <field name="markers" column="markers"/>
    </class>

    <!-- Host records, keyed by String, stored in table "host". -->
    <class name="org.apache.nutch.storage.Host" keyClass="java.lang.String" table="host">
        <primarykey column="id" length="512"/>
        <field name="metadata" column="metadata"/>
        <field name="inlinks" column="inlinks"/>
        <field name="outlinks" column="outlinks"/>
    </class>

</gora-orm>