I'd use a Switch JavaScript script element to retrieve the remote document via the wget command.
// HTTPget - retrieve file from remote web server
//
// Developed by Dwight Kelly <dkelly@apago.com>
// Copyright 2011 - Apago, Inc. -- All rights reserved
//
function jobArrived( s : Switch, job : Job )
{
// get filename to retreive
var String theURI = s.getPropertyValue("URI", job);
if (theURI.length == 0) {
job.fail("HTTPget: No URI specified!");
}
// create output file path
var slashPos = theURI.lastIndexOf( "/" );
var String outName = job.createPathWithName( theURI.substring( slashPos+1, theURI.length) );
var String args = new Array();
args[0] = "/opt/local/bin/wget";
args[1] = theURI;
args[2] = "-o";
args[3] = outName;
var myProc = new Process(args);
myProc.start();
myProc.waitForFinished(60);
if (myProc.exitStatus == 0) {
// success
job.sendToSingle(outName);
return;
}
job.fail("HTTPget failed!");
}