Mercurial > ec-dotfiles
annotate moefetch.sh @ 206:a44ba2e495a1
lolfixes
| author | edhoprima@gmail.com <edhoprima@gmail.com> |
|---|---|
| date | Mon, 29 Jun 2009 17:07:26 +0000 |
| parents | 2e866999c042 |
| children | 17d816a63b4c |
| rev | line source |
|---|---|
| 148 | 1 #!/bin/sh |
| 2 | |
| 3 # Copyright (c) 2009, edogawaconan <me@myconan.net> | |
| 4 # | |
| 5 # Permission to use, copy, modify, and/or distribute this software for any | |
| 6 # purpose with or without fee is hereby granted, provided that the above | |
| 7 # copyright notice and this permission notice appear in all copies. | |
| 8 # | |
| 9 # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES | |
| 10 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF | |
| 11 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR | |
| 12 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES | |
| 13 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN | |
| 14 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF | |
| 15 # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. | |
| 159 | 16 # |
| 17 # Lots of bugs here. Use with care | |
| 148 | 18 # USE WITH CARE |
| 159 | 19 # |
| 20 # what it does: fetch every picture that has the specified TAGS. | |
| 148 | 21 # requirement: wget, libxslt, md5sum (or md5) |
| 22 | |
# Extra directories holding the tools this script runs
# (cut, sed, wc, MD5(sum), wget, xsltproc, grep).
# When non-empty it is put in front of PATH during initialization.
ADDITIONAL_PATH=''

# Custom md5 command including its arguments.
# Expected output: <32digit md5><space(s)><filename>
# Leave empty for "md5sum" (Linux, Solaris), "md5 -r" (*BSD)
MD5=''

# Default server address. Danbooru only! I do not take responsibility of stupidity.
DEFAULT_SITE='moe.imouto.org'

# Base directory. Make sure it's writeable. I do not take responsibility if
# you don't own the folder and files as no check is done for this one.
# Structure is ${BASE_DIR}/<TAGS>
# Absolute path only.
# Leave empty to use whatever folder you're running this at
BASE_DIR=''

# not user modifiable from here

# sed program: keep only the part of a path/URL after the last slash
SED_GET_FILENAME='s/.*\/\([^\/]*\)/\1/g'
# sed program: delete "<32 lowercase hex digits>.<anything>"; whatever is left
# over means the name is NOT a plain <md5>.<extension> file name
SED_IS_MD5_FILE='s/\([0-9a-f]\{32\}\..*\)//g'
| 193 | 43 |
| 44 ### TODO: | |
| 196 | 45 ### - replace `...` with $(..) (DONE) |
| 193 | 46 ### - sanity validator |
| 47 ### - unified repository to save bandwidth | |
| 48 ### - bug stomping | |
| 49 ### - sanity checking | |
| 50 ### WILL BE FOR 0.3 | |
| 51 | |
# Welcome banner: program name with version, the copyright line, then an
# empty line.
# Globals: MOEFETCHVERSION (written) - version string shown in the banner
Msg_Welcome() {
  MOEFETCHVERSION="0.2-beta2"
  printf 'moefetch %s\n' "${MOEFETCHVERSION}"
  printf '%s\n\n' 'Copyright (c) 2009 edogawaconan <me@myconan.net>'
}
| 61 | |
# Fatal error handler: report the problem and terminate the script.
# Arguments: $1 - human readable description of the failure
# Outputs:   an empty line followed by "Fatal error: <message>" on stderr
# Exits with status 1; never returns to the caller.
Err_Fatal() {
  # The message is passed as data rather than as the printf format, so a "%"
  # or a backslash inside it (e.g. coming from a file name) is shown verbatim.
  printf '\nFatal error: %s\n' "${1}" >&2
  exit 1
}
| 67 | |
# Help message: print the usage text and terminate the script.
# Globals: DEFAULT_SITE (read) - shown as the default for -s
# Outputs: usage text on stdout
# Exits with status 2; never returns to the caller.
Err_Help() {
  cat <<EOF
moefetch.sh COMMAND [-s SITE_URL] [-nc] TAGS

COMMAND:
  (quick)fetch: do a complete update. Add prefix quick to skip file checking
  check: get list of new files, clean up local folder and print total new files

-s SITE_URL, --site SITE_URL: Specify URL of the Danbooru powered site you want to leech from. Default is ${DEFAULT_SITE}
-nc, --noclean: Do not move unknown or no longer listed files from the local folder to the trash folder

TAGS: Tags you want to download. Separated by spaces. Tag name follows standard Danbooru tagging scheme

EOF
  exit 2
}
| 84 | |
# Generate the list of image links by downloading the post index of ${SITE}
# for ${TAGS} and transforming the XML.
# Globals: SITE, TAGS, TEMP_PREFIX (read); NUMFILES (written)
# Outputs: ${TEMP_PREFIX}-xml  - XML file as saved by wget
#          ${TEMP_PREFIX}-list - one URL per line, rewritten by sed to
#                                <prefix>/<32 hex digits>.<extension>
# Exits through Err_Fatal when the download fails or the list ends up empty.
Generate_Link() {
  printf "\nFetching xml file\n"
  # Stop right here when the download fails: the message is more useful than
  # the generic "no files" error an empty XML file would produce below.
  wget "http://${SITE}/post/index.xml?tags=${TAGS}&offset=0&limit=100000" \
    -O "${TEMP_PREFIX}-xml" -e continue=off \
    || Err_Fatal "Unable to download post list from ${SITE}"
  printf "Processing XML file..."
  # xslt evilry: emit the file_url attribute of every <post>, normalise each
  # URL with sed and keep only lines that start with "http".
  # The redirection creates/truncates the list file, no separate step needed.
  xsltproc - "${TEMP_PREFIX}-xml" <<'EOF' \
    | sed 's/.*\(http.*\)\(\/[a-f0-9]\{32\}\).*\.\([^\.]*\)/\1\2.\3/g' \
    | grep '^http' > "${TEMP_PREFIX}-list" 2>/dev/null
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
<xsl:output method="xml" indent="yes"/>
<xsl:template match="post">
<xsl:value-of select="@file_url" />
</xsl:template>
</xsl:stylesheet>
EOF
  # arithmetic expansion strips the padding some wc implementations print
  NUMFILES=$(($(wc -l < "${TEMP_PREFIX}-list")))
  [ "${NUMFILES}" -gt 0 ] || Err_Fatal "Error in processing list or no files can be found with specified tag(s) or site"
  echo " ${NUMFILES} file(s) available on server"
  # output file: ${TEMP_PREFIX}-list
}
| 105 | |
|
205
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Start the progress spinner: make "-" the current frame and draw it.
# Globals: _last (written) - spinner frame currently shown
Progress_Init() {
  _last='-'
  printf '%s' "${_last}"
}
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
110 |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
111 Progress_Anim() { |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
112 case "${_last}" in |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
113 /) _last="-";; |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
114 -) _last=\\;; |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
115 \\) _last=\|;; |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
116 \|) _last="/";; |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
117 esac |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
118 printf "\b${_last}" |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
119 } |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
120 |
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Finish the progress spinner: overwrite the current frame with "done" and
# end the line.
Progress_Done() {
  printf '\b%s\n' 'done'
}
|
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
122 |
# Count the entries (hidden ones included) of a directory without using ls.
# Arguments: the directory path
# Outputs:   the number of entries on stdout; 0 for an empty directory
Count_Files() {
  _i=0
  for _f in "${*}"/* "${*}"/.*; do
    # "." and ".." are not real content. Skipping them by name instead of
    # subtracting 2 keeps the result right in shells whose ".*" never
    # matches them.
    case "${_f##*/}" in
      .|..) continue ;;
    esac
    # A pattern that matched nothing stays literal and does not exist;
    # -L keeps dangling symlinks in the count.
    if [ -e "${_f}" ] || [ -L "${_f}" ]; then
      _i=$((_i + 1))
    fi
  done
  echo "${_i}"
}
| 133 | |
# Check tools availability: choose the md5 command and verify that every
# external program the script runs can be found.
# Globals: MD5 (read; set to a platform default when empty), PATH (read),
#          MD5_COMMAND, COMMANDS, COMMAND (written)
# Exits through Err_Fatal when the platform has no known md5 tool or when a
# required program is missing.
Check_Tools() {
  # MD5: fall back to the platform's usual tool when none was configured
  if [ ! "${MD5}" ]; then
    case "$(uname)" in
      *BSD|Darwin) MD5="md5 -r" ;;
      Linux|SunOS) MD5="md5sum" ;;
      *) Err_Fatal "No known md5 tool for this platform. Please specify manually" ;;
    esac
  fi
  # ${MD5} may carry arguments; only its first word is the program to look up
  MD5_COMMAND=$(echo ${MD5} | cut -d' ' -f1)
  # basic tools
  COMMANDS="cat cut sed wc wget xsltproc xargs find rm rmdir mv mkdir chmod touch comm grep date ${MD5_COMMAND}"
  for COMMAND in ${COMMANDS}; do
    command -v "${COMMAND}" > /dev/null 2>&1 || Err_Fatal "${COMMAND} doesn't exist in ${PATH}"
  done
}
| 153 | |
# Verify required folders exist and are writeable, creating what is missing.
# Globals: BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX (read);
#          ISNEW (set to 1 when the target folder has no entries);
#          FOLDER (written, loop variable)
# Creates: ${BASE_DIR}/temp, trash, deleted and ${SITE_DIR}/${TARGET_DIR},
#          plus the ${TEMP_PREFIX}-{error,ok,list,newlist,templist} files.
# Exits through Err_Fatal when ${BASE_DIR} is not owned by the user or when
# a folder or file cannot be prepared.
Check_Folders() {
  [ -O "${BASE_DIR}" ] || Err_Fatal "You don't own ${BASE_DIR}. Please fix ${BASE_DIR}."
  for FOLDER in temp trash deleted "${SITE_DIR}/${TARGET_DIR}"; do
    if [ ! -d "${BASE_DIR}/${FOLDER}" ]; then
      # -p: the target folder is nested below ${SITE_DIR}, which does not
      # exist yet the first time a site is used
      mkdir -p "${BASE_DIR}/${FOLDER}" || Err_Fatal "${FOLDER} folder creation failed"
    fi
    if [ ! -O "${BASE_DIR}/${FOLDER}" ]; then
      echo "You don't own the ${BASE_DIR}/${FOLDER}, applying globally writeable permission on it"
      chmod -R u=rwX,g=rwX,o=rwX "${BASE_DIR}/${FOLDER}" || Err_Fatal "Error changing permissions. This shouldn't happen"
    fi
  done
  # nothing downloaded so far: later steps may skip the local file checks
  if [ "$(Count_Files "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}")" -eq 0 ]; then
    ISNEW=1
  fi
  for _suffix in error ok list newlist templist; do
    touch "${TEMP_PREFIX}-${_suffix}" || Err_Fatal "Error creating ${TEMP_PREFIX}-${_suffix}. This shouldn't happen"
  done
}
| 172 | |
|
187
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
# Do some cleanup: move everything that does not belong in
# ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR} to a time-stamped trash folder.
# An entry is trash when it is a directory, when its name is not of the form
# <32 hex digits>.<extension>, or when its name is not in the server list.
# Globals: BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX, SED_GET_FILENAME,
#          SED_IS_MD5_FILE, _last (read);
#          TRASH_DIR, TRASH, ISTRASH (written)
# Inputs:  ${TEMP_PREFIX}-list - URLs currently available on the server
# Exits through Err_Fatal when the trash folder cannot be created or an
# entry cannot be moved.
Cleanup_Repository() {
  printf "Cleaning up repository folder..."
  Progress_Init
  # Only the time stamp goes through date, so a "%" in the site or tag name
  # is not taken as a date conversion.
  TRASH_DIR="${SITE_DIR}-${TARGET_DIR}-$(date -u '+%Y%m%d-%H.%M')"
  mkdir -p "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Unable to create trash folder"
  # File names on the server, one per line, computed once for all entries.
  _nl='
'
  _server_names=$(sed -e "${SED_GET_FILENAME}" "${TEMP_PREFIX}-list")
  for TRASH in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
    # an empty folder leaves the pattern itself in TRASH: nothing to do
    [ -e "${TRASH}" ] || [ -L "${TRASH}" ] || continue
    _name="${TRASH##*/}"
    ISTRASH=
    if [ -d "${TRASH}" ]; then
      ISTRASH=1
    elif [ "$(printf '%s\n' "${_name}" | sed -e "${SED_IS_MD5_FILE}")" ]; then
      # something is left after deleting the md5 pattern: not a danbooru file
      ISTRASH=1
    else
      # exact, literal whole-line match against the server file names
      case "${_nl}${_server_names}${_nl}" in
        *"${_nl}${_name}${_nl}"*) ;;
        *) ISTRASH=1 ;;
      esac
    fi
    if [ "${ISTRASH}" ]; then
      mv -f "${TRASH}" "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Error deleting files"
      # names are printed as data; the spinner frame is redrawn on the new line
      printf '\nMoved %s to %s\n%s' "${_name}" "${BASE_DIR}/trash/${TRASH_DIR}" "${_last}"
    fi
    Progress_Anim
  done
  # drop the trash folder again when nothing was moved into it; rmdir refuses
  # to remove a non-empty folder, which is why its error is silenced
  rmdir "${BASE_DIR}/trash/${TRASH_DIR}" 2>/dev/null
  Progress_Done
}
|
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
204 |
# Check files correctness and work out which files still have to be fetched.
# When the repository is not new (ISNEW empty): optionally clean it up,
# compare every <md5>.<ext> file's checksum with its name, delete the ones
# that do not match, then list every server URL whose file is not present
# locally. When ISNEW is set, the whole server list is taken as new.
# Globals: ISNEW, ISQUICK, NOCLEAN, MD5, BASE_DIR, SITE_DIR, TARGET_DIR,
#          TEMP_PREFIX, SED_IS_MD5_FILE, _last (read);
#          FILE, TOTAL_ERROR (written)
# Inputs:  ${TEMP_PREFIX}-list    - URLs available on the server
# Outputs: ${TEMP_PREFIX}-error   - full paths of files with a wrong checksum
#          ${TEMP_PREFIX}-newlist - URLs that have to be downloaded
Check_Files() {
  if [ ! "${ISNEW}" ]; then
    [ "${NOCLEAN}" ] || Cleanup_Repository
    printf "Checking for errors..."
    Progress_Init
    : > "${TEMP_PREFIX}-error"
    for FILE in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
      # an empty folder leaves the pattern itself in FILE: nothing to check
      [ -e "${FILE}" ] || continue
      _name="${FILE##*/}"
      if [ "$(printf '%s\n' "${_name}" | sed -e "${SED_IS_MD5_FILE}")" ]; then
        # names are printed as data, never as part of the printf format
        printf '\nNot a valid danbooru file: %s\n%s' "${_name}" "${_last}"
      else
        # ${MD5} is left unquoted on purpose: it may carry arguments ("md5 -r")
        if [ "$(${MD5} "${FILE}" | cut -d ' ' -f1 -)" != "${_name%%.*}" ]; then
          echo "${FILE}" >> "${TEMP_PREFIX}-error"
          echo
          echo "Error: ${_name}"
        fi
        Progress_Anim
      fi
    done
    Progress_Done
    TOTAL_ERROR=$(($(wc -l < "${TEMP_PREFIX}-error")))
    if [ "${TOTAL_ERROR}" -eq 0 ]; then
      echo "All files OK"
    else
      printf '%s file(s) broken: removing...' "${TOTAL_ERROR}"
      # one path per line; read them whole so whitespace in ${BASE_DIR}
      # cannot split a path
      while IFS= read -r _broken; do
        rm -f "${_broken}"
      done < "${TEMP_PREFIX}-error"
      echo " ${TOTAL_ERROR} file(s) removed"
    fi
    echo "$(Count_Files "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}") file(s) available locally"

    printf "Generating list of new files..."
    Progress_Init
    # THE FILES
    # Broken files are gone by now, so a URL is new exactly when no local
    # file carries its name. Checking existence needs no sorted input and
    # never treats a file name as a pattern.
    : > "${TEMP_PREFIX}-newlist"
    while IFS= read -r _url; do
      if [ ! -e "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/${_url##*/}" ]; then
        printf '%s\n' "${_url}" >> "${TEMP_PREFIX}-newlist"
      fi
      Progress_Anim
    done < "${TEMP_PREFIX}-list"
    Progress_Done
    echo "$(($(wc -l < "${TEMP_PREFIX}-newlist"))) file(s) to be downloaded"

  else
    if [ "${ISQUICK}" ]; then
      echo "quick mode selected. Skipping check"
    else
      echo "Empty local repository"
    fi
    cat "${TEMP_PREFIX}-list" > "${TEMP_PREFIX}-newlist"
  fi
}
| 262 | |
# Start downloading the images listed in ${TEMP_PREFIX}-newlist.
# Globals: TEMP_PREFIX, BASE_DIR, SITE_DIR, TARGET_DIR (read)
# Side effects: changes the working directory to the target folder and
#               starts wget in the background (-b), logging to
#               ${TEMP_PREFIX}.log
# Exits through Err_Fatal when the target folder cannot be entered.
Fetch_Images() {
  if [ "$(($(wc -l < "${TEMP_PREFIX}-newlist")))" -eq 0 ]; then
    echo "No new file"
  else
    printf "Starting wget..."
    # wget saves into the current directory: never start it from the wrong one
    cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" \
      || Err_Fatal "Unable to enter ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
    wget -e continue=on -bi "${TEMP_PREFIX}-newlist" -o "${TEMP_PREFIX}.log"
  fi
}
| 273 | |
# Initialize base variables and do the initial command check.
# Arguments: COMMAND [-s|--site SITE_URL] [-nc|--noclean] TAGS...
#            COMMAND is one of check, fetch, quickfetch
# Globals:   ADDITIONAL_PATH, DEFAULT_SITE (read); PATH (extended, exported);
#            BASE_DIR (defaulted when empty);
#            ISQUICK, ISNEW, NOCLEAN, JOB, SITE, TAGS, TARGET_DIR, SITE_DIR,
#            TEMP_PREFIX (written)
# Exits through Err_Help on a missing/unknown command and through Err_Fatal
# when -s has no value or no tag is given.
Init(){
  # path initialization
  [ "${ADDITIONAL_PATH}" ] && PATH="${ADDITIONAL_PATH}:${PATH}"
  export PATH

  # misc variables
  ISQUICK=
  ISNEW=
  NOCLEAN=

  [ $# -lt 2 ] && Err_Help
  case "$1" in
    check|fetch|quickfetch)
      echo "Starting..."
      JOB="$1"
      ;;
    *)
      Err_Help
      ;;
  esac
  shift
  SITE=
  TAGS=
  # loop on the argument count so an empty argument does not end parsing early
  while [ $# -gt 0 ]; do
    case "$1" in
      -s|--site)
        # without this check the shift at the end of the loop would run past
        # the last argument
        [ $# -ge 2 ] || Err_Fatal "Option ${1} requires a site address"
        shift
        SITE="$1"
        ;;
      -nc|--noclean)
        NOCLEAN=1
        ;;
      '')
        # an empty argument is not a tag
        ;;
      *)
        # every further tag is put in front of the ones collected so far;
        # TARGET_DIR is derived from this order, so it is kept as it is
        if [ "${TAGS}" ]; then
          TAGS="$1 ${TAGS}"
        else
          TAGS="$1"
        fi
        ;;
    esac
    shift
  done
  [ "${SITE}" ] || SITE="${DEFAULT_SITE}"
  [ "${TAGS}" ] || Err_Fatal "No tag specified"
  # Get base folder - default, current folder or fallback to ${HOME}
  [ "${BASE_DIR}" ] || BASE_DIR="${PWD}"
  [ "${BASE_DIR}" ] || BASE_DIR="${HOME}"
  # make sure the path starts with a slash
  case "${BASE_DIR}" in
    /*) ;;
    *) BASE_DIR="/${BASE_DIR}" ;;
  esac

  echo "Tags: ${TAGS}"
  # slash is not wanted for folder name
  TARGET_DIR=$(echo "${TAGS}" | sed -e 's/\//_/g')
  SITE_DIR=$(echo "${SITE}" | sed -e 's/\/$//g;s/\//_/g')
  TEMP_PREFIX="${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}"
}
| 148 | 329 |
|
181
d3b7927bdb2b
restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
180
diff
changeset
|
# initialization
Msg_Welcome
Init "$@"
Check_Tools
Check_Folders

# let's do the job!
# quickfetch is fetch with the "repository is new" shortcut forced on, which
# makes Check_Files skip the local checks
if [ "${JOB}" = "quickfetch" ]; then
  ISNEW=1
  ISQUICK=1
fi

# every job builds the server list and the list of new files ...
case "${JOB}" in
  check|fetch|quickfetch)
    Generate_Link
    Check_Files
    ;;
esac

# ... and only the fetching jobs go on to download them
case "${JOB}" in
  fetch|quickfetch)
    Fetch_Images
    ;;
esac
