source: other-projects/nightly-tasks/diffcol/trunk/gen-model-colls.sh@ 37440

Last change on this file since 37440 was 37440, checked in by anupama, 14 months ago

Helpful display message for previous commit

File size: 30.6 KB
Line 
1#!/bin/bash
2
3# PURPOSE
4# This is not a nightly script. You use it to regenerate the model-collections
5# if Greenstone has changed fundamentally, such as what HASH OIDs get assigned
6# to documents or something that changes the contents of the index and
7# archives folders. This has happened now with the commits
8# http://trac.greenstone.org/changeset/28022 and
9# http://trac.greenstone.org/changeset/28021
10# These commits generate new stable HASH OIDs for the existing documents.
11
12
13# USAGE
14# Put this file in the toplevel of the Greenstone 2 binary/compiled SVN installation
15# that you want to generate the model collections with.
16# You can provide a list of collection names or none, in which case all the collections
17# are processed.
18
19# Pass in --svnupdate to copy across the contents of archives and index in the
20# rebuilt collection, overwriting their equivalents in the svn model collection,
21# but not removing any extraneous HASH folders already present.
22# !!!!! IMPORTANT: if you pass in svnupdate, it leaves you to do the final commit on
23# the (svn) model-collect folder!
24
25# Pass in --svndelete to remove the archives and index from svn in the model-collect
26# and replace this with the rebuilt archives and index
27# The --svndelete is useful for when the HASH directory naming has changed and everything
28# in archives and index has to be wiped out and moved back in from the rebuilt col.
29# Passing in --svndelete will do the final commits on the model-collect folder.
30
31# If neither flag is passed in, then the collections are rebuilt but the svn model-collect
32# is not updated and the repository is not updated.
33
34# Examples of usage:
35# ./gen-model-colls.sh
36# ./gen-model-colls.sh --svndelete
37# ./gen-model-colls.sh --svnupdate Tudor-Basic Tudor-Enhanced
38
39# The first just rebuilds all the collections in a new folder called collect and stops there
40
41# The second rebuilds all the collections in collect and svn removes the archives and the index
42# folders in model-collect. Then it copies across the rebuilt archives and index into model-collect
43# and svn adds them.
44
45# The third example checks out all the model-collections again, but rebuilds only the 2 collections
46# specified in the new collect folder. Then it copies across the *contents* of the archives and
47# index folders of those 2 collections into their model-collect equivalents. You then still have to
48# do the final svn commit on the model-collect folder after looking over the differences.
49
50# Also valid examples:
51# ./gen-model-colls.sh Tudor-Basic Tudor-Enhanced
52# ./gen-model-colls.sh --svndelete Tudor-Basic Tudor-Enhanced
53# ./gen-model-colls.sh --svnupdate
54
55# PSEUDOCODE
56# This script:
57# Checks out the model-collections folder from SVN
58# Makes a copy
59# In the copy: gets rid of their .svn folders, and builds each collection in turn, moving building to index once done
60# If --svndelete was passed in: svn removes model-collect/archives and model-collect/index, copies over collect/index
61# and collect/archives into model-collect and svn adds model-collect/archives and model-collect/index. Then SVN COMMITS
62# model-collect/archives and model-collect/index.
63# If --svnupdate was passed in: copies collect/archives/* into model-collect/archives/*, and copies collect/index/*
64# into model-collect/index/*, overwriting files that already existed but have now been updated upon rebuild. However,
65# --svnupdate will leave untouched any files and folders unique to model-collect. No SVN commit, that's LEFT UP TO YOU.
66
67# See earlier version of this script:
68# To svn remove what's unique to model-collect and svn add what's been rebuilt in index and archives
69# see http://stackoverflow.com/questions/7502261/delete-folder-content-and-remove-from-version-control
70
71# http://stackoverflow.com/questions/5044214/how-do-i-detect-and-or-delete-empty-subversion-directories
72# http://stackoverflow.com/questions/1301203/removing-svn-files-from-all-directories
73
74# To checkout just this file and other files at this level from trac, see
75# http://stackoverflow.com/questions/11650156/svn-checkout-depth
76# http://svnbook.red-bean.com/en/1.7/svn.advanced.sparsedirs.html
77# So you would do:
78# svn co http://svn.greenstone.org/other-projects/nightly-tasks/diffcol/trunk diffcol --depth files
79
80#*******************************GLOBAL VARIABLES***************************
81
82# mode can be svndelete or svnupdate
83mode=
84debug_mode=0
85commit_message=
86
87#*****************************FUNCTIONS*****************************
88
89# DON'T ADD ANY FURTHER ECHO STATEMENTS IN FUNCTION get_col_basename
90# "you have to be really careful on what you have in this function, as having any code which will eventually echo will mean that you get incorrect return string."
91# see http://stackoverflow.com/questions/3236871/how-to-return-a-string-value-from-a-bash-function
92function get_col_basename () {
93 collection=$1
94
95 #escape the filename (in case of space)
96 collection=`echo $collection | sed 's@ @\\\ @g'`
97
98 #get just the basename
99 collection=`basename $collection`
100
101 # returning a string does not work in bash
102 # see http://stackoverflow.com/questions/3236871/how-to-return-a-string-value-from-a-bash-function
103
104 #return $collection
105 echo $collection
106}
107
108# model-collect>svn -R propset svn:ignore -F .customignore .
109# where .customignore is a file containing:
110# log
111# earliestDatestamp
112# cache
113# model-collect>svn proplist -v
114# shows the svn properties, including the svn:ignore property. So it shows what files svn will ignore
115function svn_add_new_collection () {
116
117 collection=$1
118
119 #escape the filename (in case of space) and get just the basename
120 collection=$(get_col_basename $collection)
121
122 if [ -e model-collect/$collection ];then
123 echo "svn_add_new_collection: $collection already exists in model-collect, can't add it to svn."
124 return
125 fi
126
127 # Using rsync to copy folders while excluding files/subfolders, BUT rsync is not available on lsb
128 # http://www.linuxquestions.org/questions/linux-software-2/copy-svn-working-dir-without-svn-hidden-dirs-and-files-620586/
129 # See also http://www.thegeekstuff.com/2011/01/rsync-exclude-files-and-folders/,
130 # section "Exclude multiple files and directories at the same time" (can also use a file to blacklist folders/files)
131
132 # for GS3 we have a custom ignore file
133# if [ "x$GSDL3SRCHOME" != "x" ]; then
134# mkdir model-collect/$collection
135# svn add --force model-collect/$collection
136# svn propset -R svn:ignore -F model-collect/.customignore model-collect/$collection
137#
138# if [ "x$commit_message" == "x" ]; then
139# commit_message="Adding new model collections 1/2: new empty collection dir with svn-ignore set."
140# fi
141# if [ "$debug_mode" -eq "0" ]; then
142# svn commit -m "AUTOCOMMIT by gen-model-colls.sh script. Message: $commit_message" model-collect/$collection
143# fi
144# fi
145
146
147 # need slash on end of src dir collect/$collection/ !
148 rsync -r --exclude=.svn/ --exclude=log/ --exclude=cached/ --exclude=cache/ --exclude=earliestDatestamp --exclude=fail.log --exclude=collectionConfig.bak collect/$collection/ model-collect/$collection
149
150# find collect/$collection -name ".svn" -type d -exec rm -rf {} \;
151# cp -r collect/$collection model-collect/$collection
152
153 # http://www.thegeekstuff.com/2010/06/bash-array-tutorial/
154# ignorelist=('log' 'cache' 'archives/earliestDatestamp');
155# for ignored in "${ignorelist[@]}"; do
156# if [ -f model-collect/$collection/$ignorelist ]; then
157# rm model-collect/$collection/$ignorelist
158# elif [ -d model-collect/$collection/$ignorelist ]; then
159# rm -rf model-collect/$collection/$ignorelist
160# fi
161# done
162
163 svn add --force model-collect/$collection
164
165 # http://stackoverflow.com/questions/15880249/subclipse-svn-first-commit-ignore-certain-directories
166 # http://wolfram.kriesing.de/blog/index.php/2005/svnignore-and-svnkeywords
167 # http://boblet.tumblr.com/post/35755799/setting-up-and-using-svn-ignore-with-subversion
168 # http://www.petefreitag.com/item/662.cfm
169 # http://svnbook.red-bean.com/en/1.7/svn.advanced.props.special.ignore.html
170 # http://stackoverflow.com/questions/116074/how-to-ignore-a-directory-with-svn
171
172 # Dr Bainbridge's way of doing an svn ignore is better and involves fewer steps:
173 # create the empty collection folder (-p for subcollections), svn add it,
174 # svn:ignore all the files to be ignored
175 # copy the contents of the collection across,
176 # do an svn add --force on the collection folder
177
178 #mkdir -p model-collect/$collection
179 #svn add model-collect/$collection
180 #ignorelist=('log' 'cache' 'archives/earliestDatestamp');
181 #for ignored in "${ignorelist[@]}"; do
182 # svn propset svn:ignore $ignorelist model-collect/$collection/.
183 #done
184 # cp -r collect/$collection/* model-collect/$collection/*
185 #svn add --force model-collect/$collection
186}
187
188# Function that handles the --svndelete flag (mode) of this script for a single collection
189function svn_delete () {
190
191 # svn remove archives and index in each collection
192 # commit them all
193 # copy over newly rebuilt archives and index into each model-collection
194 # svn add the new archives and index folders of each collection
195 # commit them all
196
197
198 # make a space-separated list of all the collections
199 # to keep track of which ones should be committed from the model-collect folder
200 concatlist=
201
202 if [ "x$1" == "x" ]; then
203 for collection in collect/*; do
204 _del_col_archives_index $collection
205 concatlist="$concatlist model-$collection"
206 done
207 else
208 for collection in "$@"; do
209 _del_col_archives_index $collection
210 concatlist="$concatlist model-collect/$collection"
211 done
212 fi
213
214 # svn commit in one go all the svn rm statements done above:
215 # don't do `svn up` at this point, as doing so will then retrieve all the folders that just were svn-removed
216
217 if [ "x$commit_message" == "x" ]; then
218 commit_message="Clean rebuild of model collections 1/2. Clearing out deprecated archives and index."
219 fi
220
221 # Numerical comparisons: http://tldp.org/LDP/abs/html/comparison-ops.html
222 if [ "$debug_mode" -eq "0" ]; then
223 svn commit -m "AUTOCOMMIT by gen-model-colls.sh script. Message: $commit_message" model-collect #$concatlist
224 fi
225
226 # Having svn committed the deletes, do an svn up to locally delete what was svn-removed above,
227 # BEFORE copying from the rebuilt archives and index folders
228 if [ "$debug_mode" -eq "0" ]; then
229 svn up model-collect #/$concatlist
230 fi
231
232 # copy from the rebuilt archives and index over into the svn model-collect and svn add them
233 if [ "x$1" == "x" ]; then
234 for collection in collect/*; do
235 _add_col_archives_index $collection
236 done
237 else
238 for collection in "$@"; do
239 _add_col_archives_index $collection
240 done
241 fi
242
243 # commit all the svn add statements done just above in one go
244 if [ "x$commit_message" == "x" ]; then
245 commit_message="Clean rebuild of model collections 2/2. Adding rebuilt archives and index."
246 fi
247
248 if [ "$debug_mode" -eq "0" ]; then
249 svn commit -m "AUTOCOMMIT by gen-model-colls.sh script. Message: $commit_message" model-collect #$concatlist
250 fi
251
252 echo
253 echo "*********************"
254 echo "Done svn-deleting rebuilt model-collection: $collection"
255 echo "*********************"
256 echo
257}
258
259# To undo the changes made by svndelete, run the following manually
260# svn revert --depth infinity <model-collect/$collection/archives/*
261# svn revert --depth infinity <model-collect/$collection/archives/*
262# then remove both the local archives and index, and do an svn up to get original checkout back
263
264# svn delete this collection's archives and index folders
265# (On returning from this subroutine, the commit will be done in one step for all collections on which this function was called)
266function _del_col_archives_index () {
267 collection=$1
268
269 #escape the filename (in case of space) and get just the basename
270 collection=$(get_col_basename $collection)
271
272 if [ ! -e model-collect/$collection ]; then
273 echo "del_col_archives_index: $collection does not exist in model-collect"
274 return;
275 fi
276
277 # remove the entire archives and index folders from svn
278 if [ "$debug_mode" -eq "0" ]; then
279 svn rm --force model-collect/$collection/archives
280 svn rm --force model-collect/$collection/index
281 elif [ "$debug_mode" -eq "1" ]; then
282 rm -rf model-collect/$collection/archives
283 rm -rf model-collect/$collection/index
284 fi
285
286}
287
288
289# copy and then svn add the collection's archives and index folders
290function _add_col_archives_index () {
291 collection=$1
292
293 #escape the filename (in case of space) and get just the basename
294 collection=$(get_col_basename $collection)
295
296 if [ ! -e model-collect/$collection ]; then
297 echo "add_col_archives_index: $collection does not exist in model-collect"
298 return;
299 fi
300
301 # copy across collect.cfg file if it has been modified
302 `diff collect/$collection/etc/collect.cfg model-collect/$collection/etc/collect.cfg`
303 status=$?
304 if [ "$status" -eq "1" ]; then
305 cp collect/$collection/etc/collect.cfg model-collect/$collection/etc/collect.cfg
306 fi
307
308 # copy across the entire rebuilt index and archives folders to the svn model-collect
309 rsync -r --exclude=.svn/ --exclude=cached/ --exclude=cache/ --exclude=earliestDatestamp collect/$collection/archives model-collect/$collection
310 rsync -r --exclude=.svn/ --exclude=cached/ --exclude=cache/ collect/$collection/index model-collect/$collection
311
312 # need a --force to skip all the svn:ignored files (archives/earliestDatestamp)
313 # when doing the recursive svn add on the archives and index directories
314 if [ "$debug_mode" -eq "0" ]; then
315 svn add --force model-collect/$collection/archives
316 svn add --force model-collect/$collection/index
317 fi
318}
319
320
321# UNUSED, but useful for spotting differences between the collect and model-collect
322# after rebuild, before svn updating/deleting, as opposed to at the end of the script
323function svn_process_single_collection () {
324 collection=$1
325
326 #escape the filename (in case of space) and get just the basename
327 collection=$(get_col_basename $collection)
328
329 if [ ! -e model-collect/$collection ]; then
330 echo "svn_process_single_collection: $collection does not exist in model-collect"
331 return;
332 fi
333
334# return here if just deleting empty dirs
335#return
336
337 # diff the svn model and rebuilt model collections
338 diff_result=`diff -rq model-collect/$collection collect/$collection | grep -v ".svn"`
339# echo "Diff result for collection $collection: $diff_result"
340
341 # if no differences in the current collection, then we're done
342 if [ "x$diff_result" == "x" ]; then
343 echo "No differences in collection $collection"
344 return;
345 fi
346
347 # check that none of the lines mention files outside the archives or index folders
348 # http://en.gibney.org/tell_the_bash_to_split_by_newline_charac
349 # http://forums.gentoo.org/viewtopic-p-3130541.html
350
351 # http://wi-fizzle.com/article/276
352 # http://stackoverflow.com/questions/918886/how-do-i-split-a-string-on-a-delimiter-in-bash
353 # http://www.linuxquestions.org/questions/programming-9/split-a-string-on-newlines-bash-313206/
354 # http://unix.stackexchange.com/questions/39473/command-substitution-splitting-on-newline-but-not-space
355
356 # store backup of Internal Field Separator value, then set IFS to newline for splitting on newline
357
358 IFS_BAK=$IFS
359# IFS='\n' # splits on all whitespace
360IFS='
361'
362 # in the lines returned from the diff, test for archives or newline
363 # http://stackoverflow.com/questions/229551/string-contains-in-bash
364 for line in `diff -rq model-collect/$collection collect/$collection | grep -v ".svn"`; do
365 # echo "LINE: $line"
366 if [[ "$line" != *archives* && "$line" != *index* ]]; then
367 # the file that is different is neither in index nor in archives, send this diffline to the report
368 echo $line >> report.txt
369 fi
370 done
371
372 IFS=$IFS_BAK
373 IFS_BAK=
374}
375
376# Function that takes care of the --svnupdate flag mode of this script for a single collection
377function update_single_collection () {
378 collection=$1
379
380 #escape the filename (in case of space) and get just the basename
381 collection=$(get_col_basename $collection)
382
383 if [ ! -e model-collect/$collection ]; then
384 echo "update_single_collection: $collection does not exist in model-collect"
385 return;
386 fi
387
388 # copy across collect.cfg file if it has been modified
389 `diff collect/$collection/etc/collect.cfg model-collect/$collection/etc/collect.cfg`
390 status=$?
391 if [ "$status" -eq "1" ]; then
392 cp collect/$collection/etc/collect.cfg model-collect/$collection/etc/collect.cfg
393 fi
394
395 # copy across the contents of the rebuilt model-collection's index and archives to the svn model-collect
396 rsync -r --exclude=.svn/ --exclude=cached/ --exclude=cache/ --exclude=earliestDatestamp collect/$collection/archives/* model-collect/$collection/archives
397 rsync -r --exclude=.svn/ --exclude=cached/ --exclude=cache/ collect/$collection/index/* model-collect/$collection/index
398
399 # now svn add any and all the NEW items in model-collect's archives and index
400 # see http://stackoverflow.com/questions/1071857/how-do-i-svn-add-all-unversioned-files-to-svn
401 # see also http://stackoverflow.com/questions/116074/how-to-ignore-a-directory-with-svn
402# if [ "$debug_mode" -eq "0" ]; then
403 svn add --force model-collect/$collection/archives/* --auto-props --parents --depth infinity -q
404 svn add --force model-collect/$collection/index/* --auto-props --parents --depth infinity -q
405# fi
406
407 echo "svn model-collect update process complete. CHECK AND COMMIT THE model-collect FOLDER!"
408
409 # if etc/collect.cfg is different, copy it across too?
410
411 echo
412 echo "*********************"
413 echo "Done updating the rebuilt LOCAL model-collection: model-collect/$collection"
414 echo "*********************"
415 echo
416}
417
418
419# re-build a single collection in "collect" which is a copy of model-collect
420function build_single_collection () {
421 collection=$1
422
423 collection=$(get_col_basename $collection)
424
425 # GS2 or GS3 building
426 if [ "x$GSDL3SRCHOME" == "x" ]; then
427 import.pl -removeold $collection;
428 buildcol.pl -removeold $collection;
429 else
430 import.pl -site localsite -removeold $collection
431 buildcol.pl -site localsite -removeold $collection
432 fi
433
434 rm -rf collect/$collection/index
435 mv collect/$collection/building collect/$collection/index
436
437 echo
438 echo "*********************"
439 echo "Done rebuilding model collection: $collection"
440 echo "*********************"
441 echo
442}
443
444
445# http://stackoverflow.com/questions/16483119/example-of-how-to-use-getopt-in-bash
446function usage() {
447# usage() { echo "Usage: $0 [-s <45|90>] [-p <string>]" 1>&2; exit 1; }
448
449 echo "*******************************************"
450 echo "Usage: $0 [--svnupdate|--svndelete|--svnaddnew] [--debug] [--message 'custom commit message'] [col1, col2, col3,...]";
451 echo "If no collections are provided, all collections will be processed.";
452 echo "If none of svnupdate, svndelete or svnaddnew are provided,"
453 echo "the specified collections are just rebuilt in the collect folder.";
454 echo "*******************************************"
455 exit 1;
456}
457
458
459#*******************************MAIN PROGRAM***************************
460
461# process optional command line arguments
462# http://blog.onetechnical.com/2012/07/16/bash-getopt-versus-getopts/
463# Execute getopt
464ARGS=$(getopt -o m:uxadh -l "message:,svnupdate,svndelete,svnaddnew,debug,help" -n "$0" -- "$@");
465
466#Bad arguments
467if [ $? -ne 0 ];then
468 usage
469 exit 1
470fi
471
472eval set -- "$ARGS";
473
474
475# -n: http://tldp.org/LDP/abs/html/testconstructs.html
476while true; do
477 case "$1" in
478 -h|--help)
479 shift;
480 usage
481 exit 0
482 ;;
483 -a|--svnaddnew)
484 shift;
485 if [ "x$mode" == "xsvnupdate" ] || [ "x$mode" == "xsvndelete" ]; then
486 echo
487 echo "Can't use both svnaddnew and svndelete/svnupdate"
488 usage
489 exit 1
490 else
491 mode=svnaddnew
492# echo "svnaddnew not yet implemented"
493# exit 0
494 fi
495 ;;
496 -x|--svndelete)
497 shift;
498 if [ "x$mode" == "xsvnupdate" ] || [ "x$mode" == "xsvnaddnew" ]; then
499 echo
500 echo "Can't use both svndelete and svnupdate/svnaddnew"
501 usage
502 exit 1
503 else
504 mode=svndelete
505 fi
506 ;;
507 -u|--svnupdate)
508 shift;
509 if [ "x$mode" == "xsvndelete" ] || [ "x$mode" == "xsvnaddnew" ]; then
510 echo
511 echo "Can't use both svnupdate and svndelete/svnaddnew"
512 usage
513 exit 1
514 else
515 mode=svnupdate
516 fi
517 ;;
518 -d|--debug)
519 shift;
520 debug_mode=1
521 ;;
522 -m|--message)
523 shift;
524 if [ -n "$1" ]; then
525 commit_message=$1
526 shift;
527 fi
528 ;;
529 --)
530 shift;
531 break;
532 ;;
533 esac
534done
535
536#echo "commit message: $commit_message"
537#echo "Debug mode is: $debug_mode"
538#exit
539
540
541# Set up the Greenstone environment, this is mainly for building, but also for locating a
542# Greenstone installation folder, in case this script doesn't live in one.
543# Then cd into the collect folder's parent for the Greenstone installation.
544# Test for GS3 home env then for GS2 home and if found, cd into the GS2/GS3 home location and
545# run setup, else try to find setup.bash/gs3-setup.bash in the current location and run it.
546# Else print a warning message saying that GSDLHOME is not set.
547if [ "$GSDL3SRCHOME" != "" ]; then
548 echo "cd-ing into Greenstone 3 home directory: $GSDL3SRCHOME"
549 cd "$GSDL3SRCHOME/web/sites/localsite"
550elif [ "$GSDLHOME" != "" ]; then
551 echo "cd-ing into Greenstone home directory: $GSDLHOME"
552 cd "$GSDLHOME"
553else
554 echo "** No GS envvars set. Attempting to source the Greenstone setup script"
555 if [ -e gs3-setup.sh ]; then
556 source ./gs3-setup.sh
557 cd "$GSDL3SRCHOME/web/sites/localsite"
558 elif [ -e setup.bash ]; then
559 source ./setup.bash
560 else
561 echo "No Greenstone Home set and no setup script found in current folder."
562 echo "You need to source the setup script in a Greenstone installation. Exiting."
563 exit -1
564 fi
565fi
566
567
568# If no mode provided (svndelete|svnupdate) as cmd line arg, then don't modify
569# the svn model-collect folder. Then this script stops after rebuilding the model-copy in collect
570
571# the remaining arguments to the script are assumed to be collections
572
573# debugging
574#for collection in "$@"; do
575# collection=collect/$collection
576# echo "Collection: $collection"
577#done
578
579# finished processing arguments
580
581
582# report will contain the output of the diff for
583if [ -f report.txt ]; then
584 rm report.txt
585fi
586
587# Need the pdfbox extension for the PDFBox tutorial
588# The PDFBox ext has to be placed in the *GSDLHOME*/ext,
589# also in GS3's case where GSDLHOME is GS3/gs2build/ext
590# Go into ext and at end popd to get back into the collect folder's parent for the GS installation
591if [ ! -e "$GSDLHOME/ext/pdf-box" ]; then
592 echo "** Getting PDFBox"
593 pushd "$GSDLHOME/ext"
594 if [ ! -e "$GSDLHOME/ext/pdf-box-java.tar.gz" ]; then
595 wget --no-check-certificate https://trac.greenstone.org/export/head/gs2-extensions/pdf-box/trunk/pdf-box-java.tar.gz
596 fi
597 tar -xvzf pdf-box-java.tar.gz
598 popd
599fi
600# for GS2 need to make PDFv2Plugin.tmp functional, now that we have pdfbox
601if [ -e "$GSDLHOME/ext/pdf-box" ]; then
602 if [ -e "$GSDLHOME/perllib/plugins/PDFv2Plugin.tmp" ]; then
603 echo "** Renameing PDFv2Plugin.tmp to PDFv2Plugin.pm to work with pdf-box"
604 mv "$GSDLHOME/perllib/plugins/PDFv2Plugin.tmp" "$GSDLHOME/perllib/plugins/PDFv2Plugin.pm"
605 fi
606fi
607
608
609# move the existing collect folder out of the way
610# unless we are adding a new collection to svn, in which case, we'll grab them from whatever collect folder exists
611if [ "x$mode" != "xsvnaddnew" ] && [ -e collect ] && [ ! -e collect_orig ]; then
612 echo "** Moving collect out of the way"
613 mv collect collect_orig
614fi
615
616
617# get model-collect from svn
618# if we already have it, svn update the entire model-collect folder if processing all collections
619# or svn update just any collections specified in the model-collect folder
620if test -e model-collect; then
621 echo "** SVN updating model-collect"
622 if [ "$1" == "" ]; then
623 svn up model-collect
624 else
625 for collection in "$@"; do
626 svn up model-collect/$collection
627 done
628 fi
629else
630 echo "** Getting the model-collect folder from SVN"
631 if [ "$GSDL3SRCHOME" != "" ]; then
632 svn co http://svn.greenstone.org/other-projects/nightly-tasks/diffcol/trunk/gs3-model-collect model-collect
633 else
634 svn co http://svn.greenstone.org/other-projects/nightly-tasks/diffcol/trunk/model-collect
635 fi
636fi
637
638
639# Not using rsync to copy folders while excluding files/subfolders, since rsync is not available on lsb
640# http://www.linuxquestions.org/questions/linux-software-2/copy-svn-working-dir-without-svn-hidden-dirs-and-files-620586/
641# rsync -r --exclude=.svn/ model-collect/ collect
642
643# Make a copy of the model-collect named as the new collect
644# (or if collections are specified in the cmdline arguments, copy just these over from model-collect into collect)
645# Then remove the copy's .svn folders
646if [ "x$mode" != "xsvnaddnew" ] && [ -e collect_orig ]; then
647
648 echo "***********************************************"
649 echo "Creating a copy of the model-collect folder as folder collect and removing the .svn subfolders from the copy:"
650 echo
651
652 if [ ! -e collect ]; then
653 cp -r model-collect collect
654 find collect -name ".svn" -type d -exec rm -rf {} \; #2>&1 > /dev/null
655 else
656 if [ "$1" == "" ]; then
657 rm -rf collect
658 cp -r model-collect collect
659 find collect -name ".svn" -type d -exec rm -rf {} \;
660 else
661 for collection in "$@"; do
662 if [ -e collect/$collection ]; then
663 rm -rf collect/$collection
664 fi
665 cp -r model-collect/$collection collect/$collection
666 find collect/$collection -name ".svn" -type d -exec rm -rf {} \;
667 done
668 fi
669 fi
670 echo "***********************************************"
671fi
672
673
674# parse arguments
675# http://stackoverflow.com/questions/12711786/bash-convert-command-line-arguments-into-array
676# http://stackoverflow.com/questions/255898/how-to-iterate-over-arguments-in-bash-script
677
678if [ "$1" == "" ]; then
679
680 # all_collections
681 #for each collection, import, build, move building to index
682 for collection in collect/*; do
683 build_single_collection $collection;
684
685 if [ "x$mode" != "x" ]; then
686 #svn_process_single_collection $collection
687
688 if [ "x$mode" == "xsvnupdate" ]; then
689 update_single_collection $collection
690 elif [ "x$mode" == "xsvnaddnew" ]; then
691 svn_add_new_collection $collection
692 fi
693 fi
694 done
695
696 # having rebuilt all the collections, just the processing for svndelete remains:
697 if [ "x$mode" == "xsvndelete" ]; then
698 svn_delete
699 fi
700
701else
702 # Command-line args are a list of collections,
703 # process each command-line arg, after confirming such a collection exists
704
705 for collection in "$@"; do
706 collection=collect/$collection
707 if test -e $collection; then
708 build_single_collection $collection;
709
710 if [ "x$mode" != "x" ]; then
711 #svn_process_single_collection $collection
712
713 if [ "x$mode" == "xsvnupdate" ]; then
714 update_single_collection $collection
715 elif [ "x$mode" == "xsvnaddnew" ]; then
716 svn_add_new_collection $collection
717 fi
718 fi
719 else
720 echo
721 echo "Can't find collection $collection. Skipping."
722 echo
723 fi
724 done
725
726 # having rebuilt the specified collections above, just the processing for svndelete remains
727 if [ "x$mode" == "xsvndelete" ]; then
728 svn_delete $@
729 fi
730fi
731
732
733echo
734echo "*****************************************"
735echo
736# NO LONGER NECESSARY: WE'RE DOING A DIFF BETWEEN collect AND model-collect AT THIS SCRIPT'S END
737# if we were svn updating/deleting collections, then mode was set
738# if in that case a report was generated with additional differences, point the user to it
739#if [ -f report.txt ] && [ "x$mode" != "x" ]; then
740# echo "Some files or folders outside of archives and index directories were different. See report.txt"
741# echo
742#fi
743
744# if not svnupdating or svndeleting, then inform the user that model-collect is unchanged
745# if svnupdating, then warn the user that model-collect still needs committing
746# if svndeleting, then inform the user that model-collect has been changed and committed
747if [ "x$mode" == "x" ]; then
748 echo "* The model-collect folder has not been altered. Changes have only been made to collect"
749elif [ "x$mode" == "xsvnupdate" ]; then
750 echo "* TO DO: You still need to run svn status and svn commit on the model-collect folder. Besides that:"
751elif [ "x$mode" == "xsvndelete" ]; then
752 echo "* The model-collect folder's archives and index subfolders have been updated and committed to svn."
753elif [ "x$mode" == "xsvnaddnew" ]; then
754 echo "* The new collection(s) have been built, copied to model-collect and added to svn."
755 echo "* TO DO: You still need to run svn status and svn commit on the model-collect folder. Besides that:"
756fi
757echo
758
759if [ "x$mode" != "x" ]; then
760 echo "* DIFFERENCES REMAINING BETWEEN model-collect AND collect (skipping .svn folders):"
761 echo
762 if [ "$1" == "" ]; then
763 echo "---START DIFF---"
764 diff -rq model-collect collect | grep -v ".svn"
765 else
766 for collection in "$@"; do
767 echo "--COLLECTION: $collection"
768 diff -rq model-collect/$collection collect/$collection | grep -v ".svn"
769 echo "--"
770 done
771 fi
772 echo "---END DIFF---"
773 echo
774fi
775
776if [ -e collect_orig ]; then
777 echo "* The original collect directory has been left renamed as collect_orig"
778 echo
779fi
780
781if [ "$debug_mode" -eq "1" ]; then
782 echo "* This script was run in DEBUG MODE, nothing has been changed in svn"
783fi
784echo
785echo "*****************************************"
786echo
787
788
789# deletes empty dirs
790# find collect/$collection/archives/HASH* -type d -empty -delete
791# find collect/$collection/index/assoc/HASH* -type d -empty -delete
792
793# To recursively delete all empty dirs in the copy of model-collect (since the dirs will not have .svn folders in them anymore)
794# http://www.commandlinefu.com/commands/view/5131/recursively-remove-all-empty-directories
795#find collect -type d -empty -delete
796
797# The following when put in a separate script file will delete all folders from model-collect that are
798# empty in the copied collection (all folders which contain only a .svn subfolder in model-collect)
799# ---------------------------------------------
800#!/bin/bash
801
802#for collection in collect/*; do
803 #escape the filename (in case of space)
804# collection=`echo $collection | sed 's@ @\\\ @g'`
805
806 #get just the basename
807# collection=`basename $collection`
808
809 # HASH dirs that are empty in local collect's archives and index/assoc,
810 # need to be removed from the svn in model-collect
811
812# for line in `find collect/$collection/archives/HASH* -type d -empty`; do
813# modelline="model-$line"
814# echo "LINE: $modelline"
815
816 # remove from svn of model collect
817# svn rm $modelline
818## rm -rf $modelline
819 # remove physically from local collect
820# rm -rf $line
821# done
822
823# for line in `find collect/$collection/index/assoc/HASH* -type d -empty`; do
824# modelline="model-$line"
825# echo "LINE: $modelline"
826
827 # remove from svn of model collect
828# svn rm $modelline
829## rm -rf $modelline
830 # remove physically from local collect
831# rm -rf $line
832# done
833
834#done
835# ---------------------------------------------
Note: See TracBrowser for help on using the repository browser.