blob: 5485892e6ac82219e26f3aec4b1a69d953710c02 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nutch.crawl;
import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
import java.util.Map.Entry;
import org.apache.hadoop.io.MapWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.Writable;
/** An incoming link to a page. */
public class Inlink implements Writable {
private String fromUrl;
private String anchor;
private MapWritable md = null;
public Inlink() {
}
public Inlink(String fromUrl, String anchor) {
this.fromUrl = fromUrl;
this.anchor = anchor;
}
@Override
public void readFields(DataInput in) throws IOException {
fromUrl = Text.readString(in);
anchor = Text.readString(in);
boolean hasMD = in.readBoolean();
if (hasMD) {
md = new org.apache.hadoop.io.MapWritable();
md.readFields(in);
} else {
md = null;
}
}
/**
* Skips over one Inlink in the input.
* @param in the tuple containing the fromUrl and anchor data
* @throws IOException if there is an error reading the Inlink tuple
*/
public static void skip(DataInput in) throws IOException {
Text.skip(in); // skip fromUrl
Text.skip(in); // skip anchor
boolean hasMD = in.readBoolean();
if (hasMD) {
MapWritable metadata = new org.apache.hadoop.io.MapWritable();
metadata.readFields(in);
}
}
@Override
public void write(DataOutput out) throws IOException {
Text.writeString(out, fromUrl);
Text.writeString(out, anchor);
if (md != null && md.size() > 0) {
out.writeBoolean(true);
md.write(out);
} else {
out.writeBoolean(false);
}
}
public static Inlink read(DataInput in) throws IOException {
Inlink inlink = new Inlink();
inlink.readFields(in);
return inlink;
}
public String getFromUrl() {
return fromUrl;
}
public String getAnchor() {
return anchor;
}
public MapWritable getMetadata() {
return md;
}
public void setMetadata(MapWritable md) {
this.md = md;
}
@Override
public boolean equals(Object o) {
if (!(o instanceof Inlink))
return false;
Inlink other = (Inlink) o;
return this.fromUrl.equals(other.fromUrl)
&& this.anchor.equals(other.anchor);
}
@Override
public int hashCode() {
return fromUrl.hashCode() ^ anchor.hashCode();
}
@Override
public String toString() {
StringBuilder buffer = new StringBuilder();
if (md != null && !md.isEmpty()) {
for (Entry<Writable, Writable> e : md.entrySet()) {
buffer.append(" ");
buffer.append(e.getKey());
buffer.append(": ");
buffer.append(e.getValue());
}
}
return "fromUrl: " + fromUrl + " anchor: " + anchor + " metadata: " + buffer.toString();
}
}