Mercurial > ec-dotfiles
annotate moefetch.sh @ 213:dd95cf01602c
working around limit
author | edhoprima@gmail.com <edhoprima@gmail.com> |
---|---|
date | Tue, 30 Jun 2009 09:23:02 +0000 |
parents | da4c03c7377c |
children | a6624fb9b317 |
rev | line source |
---|---|
148 | 1 #!/bin/sh |
2 | |
3 # Copyright (c) 2009, edogawaconan <me@myconan.net> | |
4 # | |
5 # Permission to use, copy, modify, and/or distribute this software for any | |
6 # purpose with or without fee is hereby granted, provided that the above | |
7 # copyright notice and this permission notice appear in all copies. | |
8 # | |
9 # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES | |
10 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF | |
11 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR | |
12 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES | |
13 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN | |
14 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF | |
15 # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. | |
159 | 16 # |
17 # Lots of bugs here. Use with care | |
148 | 18 # USE WITH CARE |
159 | 19 # |
20 # what it does: fetch every picture that has the specified TAGS. | |
148 | 21 # requirement: wget, libxslt, md5sum (or md5) |
22 | |
159 | 23 # program additional paths for: cut, sed, wc, MD5(sum), wget, xsltproc, grep |
24 ADDITIONAL_PATH= | |
148 | 25 |
159 | 26 # custom md5 path with arguments, expected output: <32digit md5><space(s)><filename> |
27 # Leave empty for "md5sum" (Linux, Solaris), "md5 -r" (*BSD) | |
28 MD5= | |
148 | 29 |
159 | 30 # default server address. Danbooru only! I do not take responsibility of stupidity. |
31 DEFAULT_SITE="moe.imouto.org" | |
148 | 32 |
33 # Base directory. Make sure it is writable and that you own it: ownership of the directory and its working sub-folders is checked at startup, but the files inside them are not checked. | |
159 | 34 # Structure is ${BASE_DIR}/<SITE>/<TAGS> |
35 # Absolute path only. | |
36 # Leave empty to use whatever folder you're running this at | |
193 | 37 BASE_DIR= |
148 | 38 |
39 # not user modifiable from here | |
40 | |
196 | 41 SED_GET_FILENAME="s/.*\/\([^\/]*\)/\1/g" |
42 SED_IS_MD5_FILE="s/\([0-9a-f]\{32\}\..*\)//g" | |
193 | 43 |
44 ### TODO: | |
211 | 45 ### - sanity validator(?) |
193 | 46 ### - unified repository to save bandwidth |
47 ### - bug stomping | |
48 ### - sanity checking | |
49 ### WILL BE FOR 0.3 | |
50 | |
# Print the startup banner (program name, version, copyright, blank line).
# Globals: MOEFETCHVERSION (written)
Msg_Welcome() {
  MOEFETCHVERSION="0.2.1"
  printf 'moefetch %s\n' "${MOEFETCHVERSION}"
  printf '%s\n\n' 'Copyright (c) 2009 edogawaconan <me@myconan.net>'
}
60 | |
# Fatal error handler.
# Arguments: $1 - human readable error message
# Outputs:   "\nFatal error: <message>\n" on stderr
# Exits the script with status 1.
Err_Fatal() {
  # The message is passed as data, never as the format string, so paths or
  # tags containing '%' or backslashes are printed verbatim.
  printf '\nFatal error: %s\n' "${1}" >&2
  exit 1
}
66 | |
# Print the usage text to stdout and exit with status 2.
# Globals: DEFAULT_SITE (read) - shown as the default for -s
# The option list mirrors what Init accepts: -s/--site and -nc/--noclean.
Err_Help() {
  cat <<EOF
moefetch.sh COMMAND [-s SITE_URL] [-nc] TAGS

COMMAND:
  (quick)fetch: do a complete update. Add prefix quick to skip file checking
  check: get list of new files, clean up local folder and print total new files

-s SITE_URL, --site SITE_URL: Specify URL of the Danbooru powered site you want to leech from. Default is ${DEFAULT_SITE}

-nc, --noclean: Skip the cleanup step (do not move unlisted or unrecognized local files to the trash folder)

TAGS: Tags you want to download. Separated by spaces. Tag name follows standard Danbooru tagging scheme

EOF
  exit 2
}
83 | |
# Build the list of downloadable file URLs for ${TAGS} on ${SITE}.
#
# The post index is requested in pages of 1000 entries; another page is
# requested for as long as the previous page yielded at least 1000 URLs.
# Each page is run through an XSLT that prints every post's file_url, and
# sed rewrites each URL to <prefix>/<32-hex-md5>.<extension>.
#
# Globals:  SITE, TAGS, TEMP_PREFIX (read); TEMPNUM, _i, NUMFILES (written)
# Files:    ${TEMP_PREFIX}-xml, ${TEMP_PREFIX}-templist (scratch),
#           ${TEMP_PREFIX}-list (result, one URL per line)
# Exits via Err_Fatal when a page cannot be downloaded or no URL was found.
Generate_Link() {
  printf '\nFetching xml file\n'
  TEMPNUM=1001
  _i=1
  : > "${TEMP_PREFIX}-list"
  while [ "${TEMPNUM}" -ge 1000 ]; do
    # A failed download must abort: carrying on with a truncated list would
    # make the later cleanup step treat valid local files as obsolete.
    wget "http://${SITE}/post/index.xml?tags=${TAGS}&offset=0&limit=1000&page=${_i}" -O "${TEMP_PREFIX}-xml" -e continue=off \
      || Err_Fatal "Failed to download page ${_i} of the post list from ${SITE}"
    printf 'Processing XML file...'
    # xslt evilry: the stylesheet is read from stdin ("-")
    xsltproc - "${TEMP_PREFIX}-xml" <<'EOF' | sed 's/.*\(http.*\)\(\/[a-f0-9]\{32\}\).*\.\([^\.]*\)/\1\2.\3/g' | grep '^http' > "${TEMP_PREFIX}-templist"
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
<xsl:output method="xml" indent="yes"/>
<xsl:template match="post">
<xsl:value-of select="@file_url" />
</xsl:template>
</xsl:stylesheet>
EOF
    # arithmetic expansion strips the padding some wc implementations add
    TEMPNUM=$(($(wc -l < "${TEMP_PREFIX}-templist")))
    _i=$((_i + 1))
    cat "${TEMP_PREFIX}-templist" >> "${TEMP_PREFIX}-list"
  done
  NUMFILES=$(($(wc -l < "${TEMP_PREFIX}-list")))
  [ "${NUMFILES}" -gt 0 ] || Err_Fatal "Error in processing list or no files can be found with specified tag(s) or site"
  echo " ${NUMFILES} file(s) available on server"
  # output file: ${TEMP_PREFIX}-list
}
112 | |
205
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Start a spinner: remember "-" as the current frame and print it.
# Globals: _last (written) - current spinner character
Progress_Init() {
  _last="-"
  # print the frame as data, not as a printf format string
  printf '%s' "${_last}"
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
117 |
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Advance the spinner one frame (/ -> - -> \ -> | -> /) and redraw it by
# printing a backspace followed by the new frame.
# Globals: _last (read, written) - current spinner character
Progress_Anim() {
  case "${_last}" in
    /) _last="-" ;;
    -) _last='\' ;;
    '\') _last="|" ;;
    '|') _last="/" ;;
  esac
  # The frame can be a lone backslash, which is not a valid printf format;
  # pass it as an argument instead.
  printf '\b%s' "${_last}"
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
127 |
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Finish a spinner: backspace over the current frame and print "done".
Progress_Done() {
  printf '\b%s\n' 'done'
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
129 |
# Count the entries (including hidden ones) directly inside a directory,
# without parsing ls output.
# Arguments: directory path
# Outputs:   the number of entries on stdout; 0 for an empty directory
Count_Files() {
  _count_dir="${*}"
  _count=0
  for _entry in "${_count_dir}/"* "${_count_dir}/".*; do
    # Skip "." and ".." by name instead of subtracting 2 afterwards: not
    # every shell expands ".*" to them (bash 5.2+ skips them by default).
    case "${_entry}" in
      */. | */..) continue ;;
    esac
    # A pattern that matched nothing is left as literal text and does not
    # exist; -L keeps dangling symlinks in the count.
    if [ -e "${_entry}" ] || [ -L "${_entry}" ]; then
      _count=$((_count + 1))
    fi
  done
  echo "${_count}"
}
140 | |
# Verify that every external program the script runs can be found in PATH.
# Globals: MD5 (read; set to a platform default when empty),
#          MD5_COMMAND, COMMANDS, COMMAND (written)
# Exits via Err_Fatal when no md5 tool is known for the platform or a
# required program is missing.
Check_Tools() {
  # pick a default md5 tool when the user did not configure one
  if [ ! "${MD5}" ]; then
    case "$(uname)" in
      *BSD) MD5="md5 -r" ;;
      Linux | SunOS) MD5="md5sum" ;;
      *) Err_Fatal "No known md5 tool for this platform. Please specify manually" ;;
    esac
  fi
  # MD5 may carry arguments; only its first word is the program to look up
  # (left unquoted on purpose so leading blanks are dropped)
  MD5_COMMAND=$(echo ${MD5} | cut -d' ' -f1)
  # basic tools
  COMMANDS="cat chmod chown comm cut date find grep mkdir mv rm rmdir sed touch wc wget xargs xsltproc ${MD5_COMMAND}"
  for COMMAND in ${COMMANDS}; do
    command -v "${COMMAND}" >/dev/null 2>&1 || Err_Fatal "${COMMAND} doesn't exist in ${PATH}"
  done
}
160 | |
# Verify that the working folders exist and are usable, creating them when
# needed, and make sure the temporary list files exist.
# Globals: BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX (read);
#          FOLDER, i (written); ISNEW (set to 1 when the target folder
#          holds no entries)
# Exits via Err_Fatal when BASE_DIR is not owned by the caller or a folder
# or temporary file cannot be created.
Check_Folders() {
  [ -O "${BASE_DIR}" ] || Err_Fatal "You don't own ${BASE_DIR}. Please fix ${BASE_DIR}."
  for FOLDER in temp trash deleted "${SITE_DIR}/${TARGET_DIR}"; do
    if [ ! -d "${BASE_DIR}/${FOLDER}" ]; then
      # -p: the <site>/<tags> entry is nested and its parent does not exist
      # the first time a site is used
      mkdir -p "${BASE_DIR}/${FOLDER}" || Err_Fatal "${FOLDER} folder creation failed"
    fi
    if [ ! -O "${BASE_DIR}/${FOLDER}" ]; then
      echo "You don't own the ${BASE_DIR}/${FOLDER}, applying globally writeable permission on it"
      chmod -R u=rwX,g=rwX,o=rwX "${BASE_DIR}/${FOLDER}" || Err_Fatal "Error changing permissions. This shouldn't happen"
    fi
  done
  if [ "$(Count_Files "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}")" -eq 0 ]; then
    ISNEW=1
  fi
  for i in error ok list newlist templist; do
    touch "${TEMP_PREFIX}-${i}" || Err_Fatal "Error creating ${TEMP_PREFIX}-${i}. This shouldn't happen"
  done
}
179 | |
187
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
180 # Do some cleanup |
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
# Move everything that does not belong in the local repository folder
# (${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}) into a timestamped trash folder.
# An entry is trash when it is a directory, when SED_IS_MD5_FILE leaves a
# non-empty remainder of its name, or when its name does not occur in the
# server list.
# Globals: BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX, SED_GET_FILENAME,
#          SED_IS_MD5_FILE, _last (read); TRASH_DIR, TRASH, ISTRASH (written)
# Files:   reads ${TEMP_PREFIX}-list
# Exits via Err_Fatal when the trash folder cannot be created or a move fails.
Cleanup_Repository() {
  printf 'Cleaning up repository folder... '
  Progress_Init
  # Only the timestamp goes through date, so a '%' in the site or tag
  # names is not interpreted as a date conversion.
  TRASH_DIR="${SITE_DIR}-${TARGET_DIR}-$(date -u '+%Y%m%d-%H.%M')"
  mkdir -p "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Unable to create trash folder"
  for TRASH in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
    # an unmatched pattern is left as literal text: nothing to clean
    [ -e "${TRASH}" ] || [ -L "${TRASH}" ] || continue
    _trash_name="${TRASH##*/}"
    ISTRASH=
    if [ -d "${TRASH}" ]; then
      ISTRASH=1
    elif [ "$(printf '%s\n' "${_trash_name}" | sed -e "${SED_IS_MD5_FILE}")" ]; then
      # something is left after removing the <md5>.<ext> part
      ISTRASH=1
    elif [ ! "$(sed -e "${SED_GET_FILENAME}" "${TEMP_PREFIX}-list" | grep -F "${_trash_name}")" ]; then
      # -F: the name is a literal string, not a regular expression; it starts
      # with a hex digit here, so it cannot be mistaken for an option
      ISTRASH=1
    fi
    if [ "${ISTRASH}" ]; then
      mv -f "${TRASH}" "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Error deleting files"
      # names are printed as data, never as the printf format
      printf '\bMoved %s to %s\n%s' "${_trash_name}" "${BASE_DIR}/trash/${TRASH_DIR}" "${_last}"
    fi
    Progress_Anim
  done
  # drop the trash folder again when nothing was moved into it
  rmdir "${BASE_DIR}/trash/${TRASH_DIR}" 2>/dev/null
  Progress_Done
}
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
211 |
# Verify the local repository and work out which files still need to be
# downloaded.
#
# When ISNEW is empty:
#   1. run Cleanup_Repository unless NOCLEAN is set;
#   2. checksum every entry whose name passes SED_IS_MD5_FILE; files whose
#      md5 differs from the name are recorded and then removed;
#   3. write to ${TEMP_PREFIX}-newlist every server URL that does not
#      contain the name of a verified local file.
# When ISNEW is set (empty repository or quick mode) the whole server list
# is copied to ${TEMP_PREFIX}-newlist.
#
# Globals: ISNEW, ISQUICK, NOCLEAN, MD5, BASE_DIR, SITE_DIR, TARGET_DIR,
#          TEMP_PREFIX, SED_IS_MD5_FILE, _last (read);
#          FILE, TOTAL_ERROR, IS_OK (written)
# Files:   reads ${TEMP_PREFIX}-list; writes -error, -ok, -templist, -newlist
Check_Files() {
  if [ ! "${ISNEW}" ]; then
    [ "${NOCLEAN}" ] || Cleanup_Repository
    printf 'Checking for errors... '
    Progress_Init
    : > "${TEMP_PREFIX}-error"
    : > "${TEMP_PREFIX}-ok"
    for FILE in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
      # an unmatched pattern is left as literal text: nothing to check
      [ -e "${FILE}" ] || continue
      _file_name="${FILE##*/}"
      if [ "$(printf '%s\n' "${_file_name}" | sed -e "${SED_IS_MD5_FILE}")" ]; then
        printf '\bNot a valid danbooru file: %s\n%s' "${_file_name}" "${_last}"
      else
        # MD5 is deliberately unquoted: it may be a command with arguments.
        # The expected checksum is the part of the name before the first dot.
        if [ "$(${MD5} "${FILE}" | cut -d ' ' -f1)" != "${_file_name%%.*}" ]; then
          echo "${FILE}" >> "${TEMP_PREFIX}-error"
          printf '\bError: %s\n%s' "${_file_name}" "${_last}"
        else
          # Verified files are collected here directly; listing the folder
          # afterwards would also pick up the folder's own name.
          printf '%s\n' "${_file_name}" >> "${TEMP_PREFIX}-ok"
        fi
        Progress_Anim
      fi
    done
    Progress_Done
    TOTAL_ERROR=$(($(wc -l < "${TEMP_PREFIX}-error")))
    if [ "${TOTAL_ERROR}" -eq 0 ]; then
      echo "All files OK"
    else
      printf '%s file(s) broken: removing...' "${TOTAL_ERROR}"
      # one path per line; read them verbatim so blanks and quotes in
      # BASE_DIR survive
      while IFS= read -r _broken; do
        rm "${_broken}"
      done < "${TEMP_PREFIX}-error"
      echo " ${TOTAL_ERROR} file(s) removed"
    fi
    echo "$(Count_Files "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}") file(s) available locally"

    printf 'Generating list of new files... '
    Progress_Init
    # Start from the full server list and drop one verified file per pass.
    # Seeding newlist first keeps it correct when no local file was verified.
    cat "${TEMP_PREFIX}-list" > "${TEMP_PREFIX}-newlist"
    while IFS= read -r IS_OK; do
      # -F: match the file name literally, not as a regular expression
      grep -vF "${IS_OK}" "${TEMP_PREFIX}-newlist" > "${TEMP_PREFIX}-templist"
      cat "${TEMP_PREFIX}-templist" > "${TEMP_PREFIX}-newlist"
      Progress_Anim
    done < "${TEMP_PREFIX}-ok"
    Progress_Done
    echo "$(($(wc -l < "${TEMP_PREFIX}-newlist"))) file(s) to be downloaded"

  else
    if [ "${ISQUICK}" ]; then
      echo "Quick mode selected. Skipping check"
    else
      echo "Empty local repository"
    fi
    cat "${TEMP_PREFIX}-list" > "${TEMP_PREFIX}-newlist"
  fi
}
268 | |
# Download every URL listed in ${TEMP_PREFIX}-newlist into the repository
# folder using a background wget that logs to ${TEMP_PREFIX}.log.
# Globals: TEMP_PREFIX, BASE_DIR, SITE_DIR, TARGET_DIR (read)
# Side effect: changes the working directory to the repository folder.
# Exits via Err_Fatal when the repository folder cannot be entered.
Fetch_Images() {
  if [ "$(($(wc -l < "${TEMP_PREFIX}-newlist")))" -eq 0 ]; then
    echo "No new file"
  else
    printf 'Starting wget... '
    # wget saves into the current directory, so a failed cd must stop the
    # download instead of filling whatever directory we happen to be in
    cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" \
      || Err_Fatal "Unable to enter ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
    wget -e continue=on -bi "${TEMP_PREFIX}-newlist" -o "${TEMP_PREFIX}.log"
  fi
}
279 | |
# Parse the command line and initialise the global state.
# Arguments: COMMAND [-s|--site SITE] [-nc|--noclean] TAG...
# Globals:   ADDITIONAL_PATH, DEFAULT_SITE, PWD, HOME (read);
#            PATH, ISQUICK, ISNEW, NOCLEAN, JOB, SITE, TAGS, BASE_DIR,
#            TARGET_DIR, SITE_DIR, TEMP_PREFIX (written)
# Exits via Err_Help on a missing or unknown command, and via Err_Fatal
# when -s has no value or no tag was given.
Init() {
  # path initialization
  [ "${ADDITIONAL_PATH}" ] && PATH="${ADDITIONAL_PATH}:${PATH}"
  export PATH

  # misc variables; NOCLEAN is reset like the others so that a value in the
  # caller's environment cannot switch cleanup off by accident
  ISQUICK=
  ISNEW=
  NOCLEAN=

  [ $# -lt 2 ] && Err_Help
  case "$1" in
    check | fetch | quickfetch)
      echo "Starting..."
      JOB="$1"
      ;;
    *)
      Err_Help
      ;;
  esac
  shift

  SITE=
  TAGS=
  while [ "${1}" ]; do
    case "$1" in
      -s | --site)
        # without this guard the shifts below run past the last argument
        [ $# -ge 2 ] || Err_Fatal "Option ${1} requires a site address"
        shift
        SITE="$1"
        ;;
      -nc | --noclean)
        NOCLEAN=1
        ;;
      *)
        # Later tags are put in front. The resulting order determines the
        # folder name, so it is kept as is.
        if [ "${TAGS}" ]; then
          TAGS="$1 ${TAGS}"
        else
          TAGS="$1"
        fi
        ;;
    esac
    shift
  done
  [ "${SITE}" ] || SITE="${DEFAULT_SITE}"
  [ "${TAGS}" ] || Err_Fatal "No tag specified"

  # Get base folder - configured value, current folder or fallback to ${HOME}
  [ "${BASE_DIR}" ] || BASE_DIR="${PWD}"
  [ "${BASE_DIR}" ] || BASE_DIR="${HOME}"
  # force an absolute path
  case "${BASE_DIR}" in
    /*) ;;
    *) BASE_DIR="/${BASE_DIR}" ;;
  esac

  echo "Tags: ${TAGS}"
  # slash is not wanted for folder name
  TARGET_DIR=$(printf '%s\n' "${TAGS}" | sed -e 's/\//_/g')
  SITE_DIR=$(printf '%s\n' "${SITE}" | sed -e 's/\/$//g;s/\//_/g')
  TEMP_PREFIX="${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}"
}
148 | 335 |
181
d3b7927bdb2b
restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
180
diff
changeset
|
# initialization
Msg_Welcome
Init "$@"
Check_Tools
Check_Folders

# let's do the job!
# quickfetch marks the repository as new so that Check_Files takes its
# "skip the check" branch
if [ "${JOB}" = "quickfetch" ]; then
  ISNEW=1
  ISQUICK=1
fi

# every command builds the server list and compares it with the local files
case "${JOB}" in
  check | fetch | quickfetch)
    Generate_Link
    Check_Files
    ;;
esac

# only the fetch variants download anything
case "${JOB}" in
  fetch | quickfetch)
    Fetch_Images
    ;;
esac