1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23 package org.archive.crawler.processor.recrawl;
24
25
26 import java.util.Iterator;
27
28 import org.archive.crawler.datamodel.CrawlURI;
29
30 import st.ata.util.AList;
31
/**
 * Load CrawlURI attributes recorded by a previous crawl from the persistent
 * store, for consultation during the current crawl.
 *
 * @author gojomo
 * @version $Date: 2006-09-25 20:19:54 +0000 (Mon, 25 Sep 2006) $, $Revision: 4654 $
 */
39 public class PersistLoadProcessor extends PersistOnlineProcessor {
40 private static final long serialVersionUID = -1917169316015093131L;
41
42 /***
43 * Usual constructor
44 *
45 * @param name
46 */
47 public PersistLoadProcessor(String name) {
48 super(name, "PersistLoadProcessor. Loads CrawlURI attributes " +
49 "from a previous crawl for current consultation.");
50 }
51
52 @Override
53 protected void innerProcess(CrawlURI curi) throws InterruptedException {
54 if(shouldLoad(curi)) {
55 AList prior = (AList) store.get(persistKeyFor(curi));
56 if(prior!=null) {
57
58 Iterator iter = prior.getKeys();
59 curi.getAList().copyKeysFrom(iter,prior);
60 }
61 }
62 }
63 }