changeset 71:17eb428525cb

impose some limits: set http.content.limit to 500000000 (was -1) and raise http.time.limit from 300 to 600
author Henry S. Thompson <ht@inf.ed.ac.uk>
date Tue, 28 Apr 2020 19:02:14 +0100
parents efa138bcb171
children f1bf3effa893
files src/nutch-cc/conf/nutch-site.xml
diffstat 1 files changed, 2 insertions(+), 2 deletions(-) [+]
line wrap: on
line diff
--- a/src/nutch-cc/conf/nutch-site.xml	Tue Apr 28 19:01:41 2020 +0100
+++ b/src/nutch-cc/conf/nutch-site.xml	Tue Apr 28 19:02:14 2020 +0100
@@ -5,14 +5,14 @@
 
 <configuration>
   <!-- from email from Sebastian 2020-04-16, ccrawl:57[01] -->
-  <property><name>http.content.limit</name><value>-1</value></property>
+  <property><name>http.content.limit</name><value>500000000</value></property>
   <property><name>http.store.responsetime</name><value>true</value></property>
   <property><name>store.ip.address</name><value>true</value></property>
   <property><name>store.http.request</name><value>true</value></property>
   <property><name>store.http.headers</name><value>true</value></property>
   <property><name>http.accept.language</name><value>en-US,en;q=0.5</value></property>
   <property><name>http.accept.charset</name><value> </value></property>
-  <property><name>http.time.limit</name><value>300</value></property>
+  <property><name>http.time.limit</name><value>600</value></property>
   <property><name>http.timeout</name><value>45000</value></property>
   <property><name>http.redirect.max</name><value>3</value></property>
   <property><name>http.redirect.max.skip</name><value>false</value></property>