#
# ChangeLog for gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl
#
# Generated by Trac 1.4.2
# 2024-05-01T20:53:43+12:00

Wed, 16 Dec 2015 03:15:39 GMT jmt12 [30354]
    * gs2-extensions/parallel-building/trunk/src/bin/script/generate_gantt.pl (modified)
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)
    * gs2-extensions/parallel-building/trunk/src/perllib/FileUtils/HDFSShell.pm (modified)
    * gs2-extensions/parallel-building/trunk/src/perllib/inexport.pm (modified)
    * gs2-extensions/parallel-building/trunk/src/src/java/org/nzdl/gsdl/HadoopGreenstoneIngest.java (modified)
    * gs2-extensions/parallel-building/trunk/src/src/java/org/nzdl/gsdl/HadoopGreenstoneIngest2.java (modified)

    Extending manifest v2 support to allow for directories to be listed ...

Fri, 09 Aug 2013 01:16:06 GMT jmt12 [28015]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Add an extra option that allows me to pass in the directory to write ...

Sun, 21 Jul 2013 22:37:02 GMT jmt12 [27913]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Made the ingester to be used (version 1 without reduce phase, or ...

Tue, 02 Jul 2013 02:35:42 GMT jmt12 [27732]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Nice the copy itself too

Fri, 21 Jun 2013 00:25:32 GMT jmt12 [27686]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    A little more progress comments

Mon, 17 Jun 2013 22:59:52 GMT jmt12 [27654]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)
    * gs2-extensions/parallel-building/trunk/src/src/java/org/nzdl/gsdl/HadoopGreenstoneIngest.java (modified)

    Add the ability to stagger the starting of Mappers by placing a ...

Mon, 17 Jun 2013 22:31:34 GMT jmt12 [27644]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Extended to support HDFS-access via NFS.
    This applies to both the ...

Mon, 10 Jun 2013 05:09:36 GMT jmt12 [27594]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Extend hadoop_import.pl to be able to start and stop the Thrift server(s)

Sun, 09 Jun 2013 22:23:46 GMT jmt12 [27584]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    I wasn't doing -r when attempting to clear directories left in /tmp ...

Wed, 05 Jun 2013 01:06:32 GMT jmt12 [27550]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Ensure the hostname is added to the Hadoop logs so we can identify ...

Mon, 03 Jun 2013 23:08:37 GMT jmt12 [27530]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Clear out old logs, and adding more comments about what the script is ...

Mon, 27 May 2013 23:38:08 GMT jmt12 [27495]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    removing doubled up debug comments and putting some paths in ...

Thu, 23 May 2013 21:24:16 GMT jmt12 [27414]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Allowing more processing arguments to be configured at the call, and ...

Mon, 25 Mar 2013 20:14:31 GMT jmt12 [27126]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Extra clean up commands (like removing cached versions of video ...

Tue, 12 Mar 2013 00:37:21 GMT jmt12 [27058]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Adding data locality report generation to Hadoop greenstone imports

Mon, 04 Mar 2013 22:47:57 GMT jmt12 [27001]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (modified)

    Passing more environment variables (HADOOPPREFIX, HDFSHOST, HDFSPORT) ...

Mon, 25 Feb 2013 21:43:17 GMT jmt12 [26949]
    * gs2-extensions/parallel-building/trunk/src/bin/script/hadoop_import.pl (added)

    Parallel import using Hadoop