Changeset 11507 for trunk


Ignore:
Timestamp:
2006-03-28T11:35:50+12:00 (18 years ago)
Author:
shaoqun
Message:

add new parameter for wget that specifies which file extensions should be accepted

File:
1 edited

Legend:

Unmodified
Added
Removed
  • trunk/gli/src/org/greenstone/gatherer/collection/DownloadJob.java

    r10342 r11507  
    185185     */
    186186    public boolean addLink(String raw_url, int type) {
    187     ///ystem.out.println("addLink("+url+", "+type+")");
     187    ///System.out.println("addLink("+url+", "+type+")");
    188188    if(!encountered_urls.contains(raw_url)) {
    189189        // Add it to the urls we've seen.
     
    256256        }
    257257    }
     258
     259
     260     
    258261       
    259262    // The user can choose to mirror all of the page requisites...
     
    261264        command = command + "-p ";
    262265    }
     266    else{ //or only HTML page (ignore associated files e.g images, stylesheets)
     267        command = command + "-A " + ".html,.htm,.shm,.shtml,.asp,.php,.cgi,*?*=* ";
     268    }
    263269
    264270    // Download files from other hosts
     
    282288    }
    283289    // Run it
     290     
     291        //System.out.println("***"+command);
    284292    try {
    285293        //DebugStream.println("Cmd: " + command); // don't print it out cos it may have the password in it
     
    543551     */
    544552    public boolean hasSignalledStop() {
    545     if(state == DownloadJob.STOPPED || state == DownloadJob.PAUSED ||
     553        if(state == DownloadJob.STOPPED || state == DownloadJob.PAUSED ||
    546554       state == DownloadJob.COMPLETE) {
    547555        return true;
Note: See TracChangeset for help on using the changeset viewer.