1 /* SeedAcceptDecideRule
2 *
3 * $Id: SeedAcceptDecideRule.java 4649 2006-09-25 17:16:55Z paul_jack $
4 *
5 * Created on Sep 13, 2005
6 *
7 * Copyright (C) 2005 Internet Archive.
8 *
9 * This file is part of the Heritrix web crawler (crawler.archive.org).
10 *
11 * Heritrix is free software; you can redistribute it and/or modify
12 * it under the terms of the GNU Lesser Public License as published by
13 * the Free Software Foundation; either version 2.1 of the License, or
14 * any later version.
15 *
16 * Heritrix is distributed in the hope that it will be useful,
17 * but WITHOUT ANY WARRANTY; without even the implied warranty of
18 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19 * GNU Lesser Public License for more details.
20 *
21 * You should have received a copy of the GNU Lesser Public License
22 * along with Heritrix; if not, write to the Free Software
23 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
24 */
25 package org.archive.crawler.deciderules;
26
27 import org.archive.crawler.datamodel.CandidateURI;
28
29
30 /***
31 * Rule which ACCEPTs all 'seed' URIs (those for which
32 * isSeed is true). Good in a late position to ensure
33 * other scope settings don't lock out explicitly added
34 * seeds.
35 *
36 * @author gojomo
37 */
38 public class SeedAcceptDecideRule extends AcceptDecideRule {
39
40 private static final long serialVersionUID = 2167939872761313683L;
41
42 public SeedAcceptDecideRule(String name) {
43 super(name);
44 setDescription("SeedAcceptDecideRule. ACCEPTs " +
45 "all CrawlURIs that were explicitly added " +
46 "as seeds -- even if earlier scope rules " +
47 "rejected them.");
48 }
49
50 public Object decisionFor(Object object) {
51 try {
52 if (((CandidateURI)object).isSeed()) {
53 return ACCEPT;
54 }
55 } catch (ClassCastException e) {
56 // Do nothing
57 }
58 return PASS;
59 }
60 }