Context Navigation

← Previous Changeset
Next Changeset →

Changeset 7658

Timestamp:

2004-06-29T14:54:18+12:00 (20 years ago)

Author:

kjdon

Message:

Renamed collection/Job to collection/DownloadJob. Also fixed a bug in the download process. Previously we were giving the full path to wget as a prefix - this causes a bug if we try to redownload the same site again, because internal links get converted to full paths. Instead, we now run the process in a particular directory, so wget isn't given a prefix and just puts things in the current working directory with relative URLs.

Location:

trunk/gli/src/org/greenstone/gatherer

Files:

: 1 added
: 1 deleted
: 1 edited

Legend:

: Unmodified
: Added
: Removed

trunk/gli/src/org/greenstone/gatherer/WGet.java

-              r6770
+              r7658
 import javax.swing.tree.*;
 import org.greenstone.gatherer.Gatherer;
 import org.greenstone.gatherer.collection.Job;
+import org.greenstone.gatherer.collection.DownloadJob;
 /** This class provides access to the functionality of the WGet program, either by calling it via a shell script or by the JNI. It maintains a queue of pending jobs, and the component for showing these tasks to the user.
 …
     private JPanel list_pane;
     /** The job currently underway. */
     private Job job;
+    private DownloadJob job;
     /** A scroll pane which will be used to display the list of pending tasks. */
     private JScrollPane list_scroll;
 …
     /** Called by the WGet native code to inform us of a new download starting within the given job.
      * @param url The url that is being downloaded, as a <strong>String</strong>.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized void addDownload(String url) {
 …
+    }
     /* Used to advise the Job of a newly parsed link. Its up to Job to decide if it already knows about this url, and if not to update its progress bar.
+    /* Used to advise the DownloadJob of a newly parsed link. Its up to DownloadJob to decide if it already knows about this url, and if not to update its progress bar.
      * @param url The url in question as a <strong>String</strong>.
      * @param type <i>true</i> if this is an internal link, <i>false</i> for an external one.
      * @return A <i>boolean</i> with a value of <i>true</i> indicating if the url was added, <i>false</i> otherwise.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized boolean addLink(String url, int type) {
 …
      * wait until the native job has cleanly exited before removing
      * the job.
      * @param delete_me The <strong>Job</strong> that is to be deleted.
      */
     public void deleteJob(Job delete_me) {
+     * @param delete_me The <strong>DownloadJob</strong> that is to be deleted.
+     */
+    public void deleteDownloadJob(DownloadJob delete_me) {
     if (delete_me == job) {
         // While this seems wasteful its only for the briefest moment.
 …
      * for the indicated job, is completed. In turn all download
      * listeners are informed.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized void downloadComplete() {
 …
      * a status code other than 200-399 for the specified download job.
      * for.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized void downloadFailed() {
 …
      * be downloaded as doing so would clobber an existing file and the -nc
      * flag is set.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized void downloadWarning() {
 …
      * scroll pane containing the current list of jobs.
      */
     public JScrollPane getJobList() {
+    public JScrollPane getDownloadJobList() {
     return list_scroll;
+    }
 …
      * @return A boolean representing whether the user has requested to
      * stop.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized boolean hasSignalledStop() {
 …
      * @see org.greenstone.gatherer.Configuration
      * @see org.greenstone.gatherer.Gatherer
      * @see org.greenstone.gatherer.collection.Job
      * @see org.greenstone.gatherer.gui.GProgressBar
+     * @see org.greenstone.gatherer.collection.DownloadJob
+     * @see org.greenstone.gatherer.gui.DownloadProgressBar
      * @see org.greenstone.gatherer.util.GURL
      */
     public void newJob(boolean no_parents, boolean other_hosts, boolean page_requisites, URL url, int depth, String destination) {
+    public void newDownloadJob(boolean no_parents, boolean other_hosts, boolean page_requisites, URL url, int depth, String destination) {
     // Create the job and fill in the details from gatherer.config.
     Gatherer.println("About to create a new job");
+    // If it was decided not to download page requisites, then create the destination by basing it on the given destination, but appending the url host and paths. If page requisites is used then WGet will do this for us
+    if(!page_requisites && depth == 0) {
+        Gatherer.println("Initially destination: " + destination);
+        String almost_the_entire_path = url.getPath();
+        int index = -1;
+        if((index = almost_the_entire_path.lastIndexOf("/")) != -1) {
+        almost_the_entire_path = almost_the_entire_path.substring(0, index);
+        }
+        destination = destination + url.getHost() + almost_the_entire_path;
+        Gatherer.println("Final destination:    " + destination);
+    }
+    Job new_job = new Job(Gatherer.config.get("mirroring.debug", false), no_parents, other_hosts, page_requisites, Gatherer.config.get("mirroring.quiet", false), url, depth, destination, Gatherer.config.proxy_pass, Gatherer.config.proxy_user, this, simple);
+    DownloadJob new_job = new DownloadJob(Gatherer.config.get("mirroring.debug", false), no_parents, other_hosts, page_requisites, Gatherer.config.get("mirroring.quiet", false), url, depth, destination, Gatherer.config.proxy_pass, Gatherer.config.proxy_user, this, simple);
     // Tell it to run as soon as possible
     new_job.setState(Job.RUNNING);
+    new_job.setState(DownloadJob.RUNNING);
     // Add to job_queue job list.
 …
      * @param expected A long representing the total number of bytes
      * expected for this download.
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public synchronized void updateProgress(long current, long expected) {
 …
      * waiting list.
      * @see org.greenstone.gatherer.Gatherer
      * @see org.greenstone.gatherer.collection.Job
+     * @see org.greenstone.gatherer.collection.DownloadJob
      */
     public void run() {
 …
         while(job_queue.size() > 0 && index < job_queue.size()) {
             // Get the first job that isn't stopped.
             job = (Job) job_queue.get(index);
             if(job.getState() == Job.RUNNING) {
             Gatherer.println("Job " + job.toString() + " Begun.");
+            job = (DownloadJob) job_queue.get(index);
+            if(job.getState() == DownloadJob.RUNNING) {
+            Gatherer.println("DownloadJob " + job.toString() + " Begun.");
             // A lock to prevent us deleting this job while its being
             // run, unless you want things to go really wrong.
 …
+            }
             busy = false;
             Gatherer.println("Job " + job.toString() + " complete.");
+            Gatherer.println("DownloadJob " + job.toString() + " complete.");
             // And if the user has requested that complete jobs
                 // be removed, then remove it from the list.
             //deleteJob(job);
+            //deleteDownloadJob(job);
             job = null;
+            }
 …
         try {
             synchronized(this) {
             Gatherer.println("WGet thread is waiting for Jobs.");
+            Gatherer.println("WGet thread is waiting for DownloadJobs.");
             wait();
+            }

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 7658

Legend:

trunk/gli/src/org/greenstone/gatherer/WGet.java

Download in other formats: