<map>
<!-- plugin_cache_result_list: associates HTTP result code 404 with the
     CacheException subclass NoRetryDeadLinkException named in the value. -->
<entry>
  <string>plugin_cache_result_list</string>
  <list>
    <string>404=org.lockss.util.urlconn.CacheException$NoRetryDeadLinkException</string>
  </list>
</entry>
<!-- plugin_version: version of this plugin definition, stored as a string. -->
<entry>
  <string>plugin_version</string>
  <string>2</string>
</entry>
<!-- plugin_config_props: the configuration parameters of an archival unit.
     Two parameters are declared, base_url and from; both are marked
     definitional and neither is default-only.
     NOTE(review): type codes 3 and 1 are presumably the URL and string types
     of org.lockss.daemon.ConfigParamDescr; confirm against that class. -->
<entry>
  <string>plugin_config_props</string>
  <list>
    <org.lockss.daemon.ConfigParamDescr>
      <key>base_url</key>
      <displayName>Base URL</displayName>
      <!-- The angle brackets around journal-name must be written as entities;
           a raw "<" here would start an element and break well-formedness. -->
      <description>Usually of the form http://&lt;journal-name&gt;.com/</description>
      <type>3</type>
      <size>40</size>
      <definitional>true</definitional>
      <defaultOnly>false</defaultOnly>
    </org.lockss.daemon.ConfigParamDescr>
    <org.lockss.daemon.ConfigParamDescr>
      <key>from</key>
      <displayName>From</displayName>
      <description>String indicating the subest of etds, often indicating year/date range </description>
      <type>1</type>
      <size>40</size>
      <definitional>true</definitional>
      <defaultOnly>false</defaultOnly>
    </org.lockss.daemon.ConfigParamDescr>
  </list>
</entry>
<!-- au_name: printf-style template for the archival unit name; the single %s
     is filled from the "from" parameter. -->
<entry>
  <string>au_name</string>
  <string>"PUC RIO Etds %s ...", from</string>
</entry>
<!-- au_crawl_depth: integer crawl depth of 3.
     NOTE(review): presumably counted in link levels from the start URL; confirm. -->
<entry>
  <string>au_crawl_depth</string>
  <int>3</int>
</entry>
<!-- au_start_url: printf-style template for the crawl start page; base_url is
     substituted for %s and followed directly by ":8001/MetaArchive/manifest.html".
     NOTE(review): because the port is appended right after %s, base_url is
     presumably expected without a trailing slash or port; confirm. -->
<entry>
  <string>au_start_url</string>
  <string>"%s:8001/MetaArchive/manifest.html", base_url</string>
</entry>
<!-- au_def_new_content_crawl: default new-content crawl interval as a long.
     NOTE(review): presumably milliseconds, in which case 2592000000 is 30 days;
     confirm the unit. -->
<entry>
  <string>au_def_new_content_crawl</string>
  <long>2592000000</long>
</entry>
<!-- au_def_pause_time: default pause between fetches as a long.
     NOTE(review): presumably milliseconds, in which case 6000 is 6 seconds;
     confirm the unit. -->
<entry>
  <string>au_def_pause_time</string>
  <long>6000</long>
</entry>
<!-- plugin_name: display name of the plugin. The value carries a trailing
     space, which is kept as-is because it is part of the stored string. -->
<entry>
  <string>plugin_name</string>
  <string>PUC RIO etds </string>
</entry>
<!-- plugin_notes: free-text note describing what the plugin collects. -->
<entry>
  <string>plugin_notes</string>
  <string>This plugin harvests all *.PDF, *.xml, *.xsl file it encounters during its crawl </string>
</entry>
<!-- plugin_identifier: dotted identifier string for this plugin. -->
<entry>
  <string>plugin_identifier</string>
  <string>br.pucrio.etds</string>
</entry>
<!-- au_crawlrules: ordered crawl rules, each written as
     action,"printf-style regex template", arguments.
     NOTE(review): in LOCKSS crawl rules, action 1 is presumably "include if
     the URL matches" and action 4 "exclude if the URL does not match";
     confirm against the CrawlRules action codes. -->
<entry>
  <string>au_crawlrules</string>
  <list>
    <!-- Reject anything that does not begin with base_url. -->
    <string>4,"^%s", base_url</string>
    <string>1,"^%s:8001/MetaArchive/manifest.html$", base_url</string>
    <!-- NOTE(review): the two transform rules use port 8081 while every other
         rule and the start URL use 8001; confirm this is intentional. -->
    <string>1,"^%s:8081/MetaArchive/transform$", base_url</string>
    <!-- The "?" that introduces the query string is escaped so it matches
         literally; unescaped it made the preceding "p" optional and the rule
         could never match a real transform.php?dcxml=... URL. The tail is
         written as /.*\.xml (regex) instead of the glob-like /*.xml. Every URL
         this rule accepts is also accepted by the unanchored rule that follows. -->
    <string>1,"^%s:8081/MetaArchive/transform\.php\?dcxml=%s-.*/.*\.xml", base_url, from</string>
    <!-- Unanchored: matches the from-prefixed XML path anywhere in the URL. -->
    <string>1,"%s-.*/.*.xml", from</string>
    <!-- NOTE(review): the "." before each extension below is unescaped and so
         matches any character (e.g. a URL ending in "=pdf"). Left unchanged
         because escaping it would narrow what is currently collected. -->
    <string>1,"^%s:8001/.*.XSL$", base_url</string>
    <string>1,"^%s:8001/.*.xsl$", base_url</string>
    <string>1,"^%s:8001/.*.PDF$", base_url</string>
    <string>1,"^%s:8001/.*.pdf$", base_url</string>
  </list>
</entry>
</map>
<!--
Parameter Values |
Status |
Copies |
|
(Loading) |
-->