Skip to content

Commit

Permalink
Merge pull request #12 from getwasim/master
Browse files Browse the repository at this point in the history
Formatting
  • Loading branch information
Arsen A. Gutsal committed Feb 7, 2014
2 parents 6e52e25 + c93f4a5 commit f30ea69
Showing 1 changed file with 22 additions and 24 deletions.
46 changes: 22 additions & 24 deletions grails-app/conf/Config.groovy
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ log4j = {
warn 'org.apache.camel'
trace 'gnutch'

//trace 'gnutch.indexer.DocumentIndexer.dom'
//trace 'gnutch.indexer.DocumentIndexer.dom'
}


Expand All @@ -24,16 +24,16 @@ environments {
'org.springframework',
'org.hibernate',
'net.sf.ehcache.hibernate'


warn 'org.apache.camel'
debug 'gnutch'

//trace 'gnutch.indexer.DocumentIndexer.dom'
//trace 'gnutch.indexer.DocumentIndexer.dom'
}

gnutch {
// Input route definition
// Input route definition
inputRoute = 'file:///home/archer/tmp/gnutch-input'

aggregationTime = 60000L
Expand All @@ -44,16 +44,16 @@ environments {
multiplier = 10
}
handlers {
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// ex.in.body contains XHTML document (actually contains reference to org.w3c.dom.Document)
postHTTP = { Exchange ex ->

}
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// ex.in.body contains XHTML document (actually contains reference to org.w3c.dom.Document)
postXHTML = { Exchange ex ->

}
}

// org.apache.camel.Processor definition. Called after XML is built
// ex.in.body contains XML document (actually contains reference to org.w3c.dom.Document)
Expand All @@ -69,7 +69,7 @@ environments {
// acquiring `source` field
def nodeList = doc.getElementsByTagName("field")
def id = nodeList.find { it.getAttribute("name") == "id"}.textContent

def m = id =~ /https?:\/\/([^\/]*)\//
try{
def sourceElement = doc.createElement("field")
Expand Down Expand Up @@ -102,34 +102,32 @@ environments {
}

http {
// UserAgent string. Better if contain email address of person who is responsible
// UserAgent string. Better if contain email address of person who is responsible
// for crawling. That will allow source owners to contact person directly
userAgent = "GNutch crawler. Contact maintainer: [email protected]"
// Maximum number of connections per host
defaultMaxConnectionsPerHost = 1000
// Maximum number of total connections
maxTotalConnections = 1000
customHeaders = [
Cookie: 'PacerUser="mu023901391517923 66uziNFVAR."; PacerSession=4weby3qfsJY8BzLiG2bP8+6WpaY6iHw0yHus6YIiEtUC1o1rGgh4R5RhatqFWeKXVNTyt9Ak7Xlcqh80IUD+Hjy2btQCzWiG; PacerPref=receipt=Y'
]
customHeaders = []
}

solr {
coreUrl = 'http://92.52.145.2:8983/solr/collection1'
}

activemq {
// URL to message broker
brokerURL = 'vm://localhost'
// brokerURL = 'tcp://localhost:61616'
// conf = 'classpath:activemq.xml'
}
}
}
}

test {
gnutch {
// Input route definition
// Input route definition
inputRoute = 'file:///home/archer/tmp/gnutch-input'

aggregationTime = 10000L
Expand All @@ -141,17 +139,17 @@ environments {
}

handlers {
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// org.apache.camel.Processor definition. Called after HTML is transformed into XHTML
// ex.in.body contains XHTML document (actually contains reference to org.w3c.dom.Document)
postXHTML = { Exchange ex ->

}
}

// org.apache.camel.Processor definition. Called after XML is built
// ex.in.body contains XML document (actually contains reference to org.w3c.dom.Document)
postXML = { Exchange ex ->

}
}

validate = { Exchange ex ->
return true
Expand All @@ -164,24 +162,24 @@ environments {
}

}

http {
// UserAgent string. Better if contain email address of person who is responsible
// UserAgent string. Better if contain email address of person who is responsible
// for crawling. That will allow source owners to contact person directly
userAgent = "GNutch crawler (https://github.com/softsky/gnutch): [email protected]"
// Maximum number of connections per host
defaultMaxConnectionsPerHost = 1000
// Maximum number of total connections
maxTotalConnections = 1000
}

activemq {
// URL to message broker
brokerURL = 'vm://localhost?broker.persistent=false'
// brokerURL = 'tcp://localhost:61616'
// conf = 'classpath:activemq.xml'
}
}
}

}
}

0 comments on commit f30ea69

Please sign in to comment.