Mercurial > ec-dotfiles
annotate moefetch.sh @ 225:265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
- Preparation for name-safe file operations.
- Sanity against sed
- Correctly encoded url (hopefully)
- getopts replacing fail hackjob with while and shift
- support for login (provided with openssl)
author | edhoprima |
---|---|
date | Fri, 13 Nov 2009 18:47:02 +0000 |
parents | 0ac1805621d4 |
children | f8be4a3d3b4a |
rev | line source |
---|---|
221
e891b563b797
wrong rule caused mass headache
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
220
diff
changeset
|
1 #!/bin/sh |
148 | 2 |
3 # Copyright (c) 2009, edogawaconan <me@myconan.net> | |
4 # | |
5 # Permission to use, copy, modify, and/or distribute this software for any | |
6 # purpose with or without fee is hereby granted, provided that the above | |
7 # copyright notice and this permission notice appear in all copies. | |
8 # | |
9 # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES | |
10 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF | |
11 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR | |
12 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES | |
13 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN | |
14 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF | |
15 # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. | |
159 | 16 # |
17 # Lots of bugs here. Use with care | |
148 | 18 # USE WITH CARE |
159 | 19 # |
20 # what it does: fetch every picture that has the specified TAGS. | |
225
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
21 # requirement: wget, libxslt, openssl |
148 | 22 |
225
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
23 # program additional paths for: cut, sed, wc, openssl, wget, xsltproc, grep |
159 | 24 ADDITIONAL_PATH= |
148 | 25 |
159 | 26 # default server address. Danbooru only! I do not take responsibility of stupidity. |
27 DEFAULT_SITE="moe.imouto.org" | |
148 | 28 |
29 # base directory. make sure it's writeable. I do not take responsibility if you don't own the folder and files as no check is done for this one. | |
159 | 30 # Structure is ${BASE_DIR}/<TAGS> |
31 # Absolute path only. | |
32 # Leave empty to use whatever folder you're running this at | |
193 | 33 BASE_DIR= |
148 | 34 |
35 # not user modifiable from here | |
36 | |
193 | 37 ### TODO: |
211 | 38 ### - sanity validator(?) |
193 | 39 ### - unified repository to save bandwidth |
40 ### - bug stomping | |
41 ### - sanity checking | |
42 ### WILL BE FOR 0.3 | |
43 | |
# Print the program banner (name, version, copyright, blank line).
# Globals: MOEFETCHVERSION (written) - version string shown in the banner.
Msg_Welcome() {
  MOEFETCHVERSION="0.3-beta2"
  printf '%s\n' \
    "moefetch ${MOEFETCHVERSION}" \
    "Copyright (c) 2009 edogawaconan <me@myconan.net>" \
    ""
}
51 | |
225
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
# Print the bare hex MD5 digest of the file named by $1.
# Some OpenSSL releases prefix the digest with a label ending in "= "
# (e.g. "(stdin)= "); the label is stripped so the result can be compared
# directly with a file name. Output that has no label is passed through.
# Returns: non-zero if the file cannot be read or openssl fails.
get_md5() {
  _md5_out=$(openssl dgst -md5 < "$1") || return
  printf '%s\n' "${_md5_out##*= }"
}
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
# Print the last path component of $1.
# "--" keeps a name that starts with "-" from being read as an option.
get_basename() {
  basename -- "${1}"
}
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
# Print the last path component of $1 with its final ".ext" suffix removed.
# The directory part is dropped *before* the suffix is stripped, so a dot in
# a directory name (such as a site directory like "moe.imouto.org") can no
# longer truncate the path of an entry that has no extension.
get_filename() {
  _fn_base=$(basename -- "$1") || return
  printf '%s\n' "${_fn_base%.*}"
}
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
# Join all arguments with single spaces and percent-encode the characters
# that would otherwise break the query string the result is embedded in:
#   &  -> %26   (parameter separator)
#   =  -> %3D   (key/value separator)
#   #  -> %23   (would start a URL fragment and cut off the rest of the query)
#   ' '-> %20
# No trailing separator is emitted. "%" and "+" are deliberately left alone
# so input that is already encoded keeps its meaning.
get_cleantags() {
  # Trailing newline so every sed implementation processes the (only) line.
  printf '%s\n' "$*" \
    | sed -e 's/&/%26/g' -e 's/=/%3D/g' -e 's/#/%23/g' -e 's/ /%20/g'
}
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
# Test whether the name of $1 (directory and extension removed by
# get_filename) is something other than exactly 32 lowercase hex digits.
# Output: nothing when the name is a 32-digit hex string; otherwise a
#         non-empty string (the name, or $1 itself when the name is empty).
# Callers test the output with [ -n ... ].
Is_NotMD5() {
  _nm_name=$(get_filename "$1")
  case "${_nm_name}" in
    *[!0-9a-f]*)
      # At least one character is not a lowercase hex digit.
      printf '%s\n' "${_nm_name}"
      ;;
    *)
      # Only hex digits (or empty): it is an MD5 only at exactly 32 characters.
      [ "${#_nm_name}" -eq 32 ] || printf '%s\n' "${_nm_name:-$1}"
      ;;
  esac
}
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
57 |
265a9ca47a19
- Replaced md5(sum) with openssl. Less platform dependent because the tool is same across platforms
edhoprima
parents:
224
diff
changeset
|
58 |
# Fatal error handler: print a blank line followed by "Fatal error: <$1>"
# on stderr and terminate the script with status 1.
# printf '%s' is used so backslashes or "%" in the message are printed as-is.
Err_Fatal() {
  printf '\nFatal error: %s\n' "${1}" >&2
  exit 1
}
65 | |
215
710082ce6788
major cleanup part2.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
214
diff
changeset
|
# Handler for failures that should not happen during normal operation
# (e.g. a mkdir/mv/cp on the script's own working directories failing).
# Prints a report request on stderr and terminates the script with status 1.
Err_Impossible() {
  printf '%s\n' \
    "" \
    "Impossible error. Or you modified content of the working directories when the script is running." \
    "Please report to moefetch.googlecode.com if you see this message (complete with entire run log)" >&2
  exit 1
}
710082ce6788
major cleanup part2.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
214
diff
changeset
|
72 |
# Print the usage message on stderr and terminate with status 2.
# Documents every option the argument parser accepts (-n, -p, -s, -u).
# Globals: DEFAULT_SITE (read) - shown as the default for -s.
Err_Help() {
  printf '%s\n' \
    "moefetch.sh COMMAND [-n] [-p PASSWORD] [-s SITE_URL] [-u USERNAME] TAGS" \
    "" \
    "COMMAND:" \
    "    (quick)fetch: do a complete update. Add prefix quick to skip file checking" \
    "    check: get list of new files, clean up local folder and print total new files" \
    "" \
    "OPTIONS:" \
    "    -n: do not clean up the local folder before checking it" \
    "    -p PASSWORD: password used to log in to the site" \
    "    -s SITE_URL: Specify URL of the Danbooru powered site you want to leech from. Default is ${DEFAULT_SITE}" \
    "    -u USERNAME: user name used to log in to the site" \
    "" \
    "TAGS: Tags you want to download. Separated by spaces. Tag name follows standard Danbooru tagging scheme" >&2
  exit 2
}
86 | |
# Build the list of downloadable file URLs for ${TAGS} on ${SITE}.
#
# The post index is requested page by page (1000 posts per request). Each
# XML page is reduced with xsltproc to the posts' file_url values, which sed
# rewrites to "<url prefix>/<32-hex>.<ext>" before they are appended to
# ${TEMP_PREFIX}-list. Paging stops after the first page that yields fewer
# than 1000 URLs.
#
# A failed download aborts the run: carrying on with a partial list would
# make every file missing from it look obsolete to the later clean-up step.
#
# Globals read:    SITE, TAGS, LOGIN_USER, LOGIN_PASS, TEMP_PREFIX
# Globals written: tempnum, iternum, numfiles
# Files written:   ${TEMP_PREFIX}-xml, -templist, -list
# Exits through Err_Fatal when a page cannot be fetched or no URL is found.
Generate_Link() {
  echo "
Fetching XML file"
  tempnum=1000
  iternum=1
  : > "${TEMP_PREFIX}-list"
  while [ "${tempnum}" -ge 1000 ]; do
    wget "http://${SITE}/post/index.xml?tags=$(get_cleantags "${TAGS}")&offset=0&limit=1000&page=${iternum}&login=${LOGIN_USER}&password_hash=${LOGIN_PASS}" -O "${TEMP_PREFIX}-xml" -e continue=off \
      || Err_Fatal "Failed to fetch page ${iternum} of the post list from ${SITE}"
    printf "Processing XML file... "
    # xslt evilry: the stylesheet comes from stdin (the here-document), the
    # downloaded XML is the document. Only lines starting with "http" are kept.
    xsltproc - "${TEMP_PREFIX}-xml" <<'EOF' | sed 's/.*\(http.*\)\(\/[a-f0-9]\{32\}\).*\.\([^\.]*\)/\1\2.\3/g' | grep ^http > "${TEMP_PREFIX}-templist"
<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
<xsl:output method="xml" indent="yes"/>
<xsl:template match="post">
<xsl:value-of select="@file_url" />
</xsl:template>
</xsl:stylesheet>
EOF
    # Arithmetic expansion strips the padding some wc implementations print.
    tempnum=$(( $(wc -l < "${TEMP_PREFIX}-templist") ))
    iternum=$((iternum + 1))
    cat "${TEMP_PREFIX}-templist" >> "${TEMP_PREFIX}-list"
    echo "${tempnum} file(s) available"
  done
  numfiles=$(( $(wc -l < "${TEMP_PREFIX}-list") ))
  echo "${numfiles} file(s) available on server"
  [ "${numfiles}" -gt 0 ] || Err_Fatal "Error in processing list or no files can be found with specified tag(s) or site."
}
a6624fb9b317
major cleanup. tweaking.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
213
diff
changeset
|
115 |
148 | 116 |
205
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Start the progress spinner: remember "-" as the current frame and print it.
# Globals: _last (written) - the spinner frame currently on screen.
Progress_Init() {
  _last="-"
  printf '%s' "${_last}"
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
121 |
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Advance the progress spinner by one frame: backspace over the previous
# frame and print the next one. Frame order: - \ | / and back to -.
# The frame is passed to printf as an argument, never as part of the format,
# so the "\" frame cannot be misread as the start of an escape sequence.
# Globals: _last (read and written) - the spinner frame currently on screen.
Progress_Anim() {
  case "${_last}" in
    /)   _last='-' ;;
    -)   _last='\' ;;
    '\') _last='|' ;;
    '|') _last='/' ;;
    *)   _last='-' ;;  # spinner not initialised: start from the first frame
  esac
  printf '\b%s' "${_last}"
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
131 |
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
# Finish the progress spinner: backspace over the last frame and print
# "done" followed by a newline.
Progress_Done() {
  printf '\b%s\n' "done"
}
2e866999c042
now with useless animation
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
204
diff
changeset
|
133 |
# Count the entries (files, directories, hidden names) directly inside the
# directory given by the arguments, without parsing ls.
# "." and ".." are skipped by name rather than assumed to be matched by ".*",
# because shells differ on whether that glob includes them. Unmatched glob
# patterns, which stay literal, are ignored by the existence test.
# Output: the count on stdout (0 for an empty or missing directory).
Count_Files() {
  _cf_dir="$*"
  _cf_count=0
  for _cf_entry in "${_cf_dir}"/* "${_cf_dir}"/.*; do
    case "${_cf_entry##*/}" in
      .|..) continue ;;
    esac
    # -L also counts dangling symlinks, for which -e is false.
    if [ -e "${_cf_entry}" ] || [ -L "${_cf_entry}" ]; then
      _cf_count=$((_cf_count + 1))
    fi
  done
  echo "${_cf_count}"
}
144 | |
# Verify that every external program the script runs can be found in PATH.
# The first missing program is reported through Err_Fatal, which ends the run.
# The original list is kept unchanged and extended with the tools that were
# being invoked without a check: basename, cat, chmod, cp, mv, rmdir, touch.
# Globals: commands, cmd (written); PATH (read).
Check_Tools() {
  commands="cut sed wc wget xsltproc xargs rm mkdir chown comm grep date openssl basename cat chmod cp mv rmdir touch"
  # Intentionally unquoted: the list is split on whitespace.
  for cmd in ${commands}; do
    command -v "${cmd}" >/dev/null 2>&1 || Err_Fatal "${cmd} doesn't exist in ${PATH}"
  done
}
154 | |
# Verify that the working directories exist and are usable, creating them
# when necessary, and create the temporary list files.
#
# Steps:
#   1. ${BASE_DIR} must be owned by the current user, otherwise Err_Fatal.
#   2. temp, trash, deleted and ${SITE_DIR}/${TARGET_DIR} are created under
#      ${BASE_DIR} if missing; a directory not owned by the current user gets
#      read/write permission for everyone (recursively).
#   3. ISNEW is set to 1 when the target directory holds no entries.
#   4. ${TEMP_PREFIX}-{error,ok,list,newlist,templist} are touched; a failure
#      is reported through Err_Fatal.
#
# Globals read:    BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX
# Globals written: ISNEW, directory, i
Check_Folders(){
  [ -O "${BASE_DIR}" ] || Err_Fatal "You don't own ${BASE_DIR}. Please fix ${BASE_DIR} or run this script in your own directory."
  for directory in temp trash deleted "${SITE_DIR}/${TARGET_DIR}"; do
    if [ ! -d "${BASE_DIR}/${directory}" ]; then
      mkdir -p "${BASE_DIR}/${directory}" || Err_Impossible
    fi
    if [ ! -O "${BASE_DIR}/${directory}" ]; then
      echo "You don't own the ${BASE_DIR}/${directory}, applying globally writeable permission on it"
      chmod -R u=rwX,g=rwX,o=rwX "${BASE_DIR}/${directory}" || Err_Impossible
    fi
  done
  if [ "$(Count_Files "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}")" -eq 0 ]; then
    ISNEW=1
  fi
  for i in error ok list newlist templist; do
    touch "${TEMP_PREFIX}-${i}" || Err_Fatal "Error creating ${TEMP_PREFIX}-${i}. This shouldn't happen"
  done
}
173 | |
187
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
# Move everything that does not belong in the local repository folder
# ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR} into a time-stamped trash directory
# under ${BASE_DIR}/trash. An entry is moved when it is a directory, when
# its name is not an MD5-style name (Is_NotMD5), or when its base name does
# not occur in ${TEMP_PREFIX}-list.
#
# The trash directory is created on demand and removed again if it ends up
# empty. A summary of the moved entries is printed when there are any.
#
# Globals read:    BASE_DIR, SITE_DIR, TARGET_DIR, TEMP_PREFIX
# Globals written: trash_dir, trashes, has_trash, trash
# Exits through Err_Impossible when a directory cannot be prepared or an
# entry cannot be moved.
Cleanup_Repository() {
  printf "Cleaning up repository folder... "
  Progress_Init
  # The site/tag text stays outside the date format so a "%" in a tag cannot
  # be interpreted as a date conversion.
  trash_dir="${BASE_DIR}/trash/${SITE_DIR}-${TARGET_DIR}-$(date -u "+%Y%m%d-%H.%M")"
  trashes="These files have been moved to ${trash_dir}:"
  has_trash=
  if [ ! -d "${trash_dir}" ]; then
    mkdir -p "${trash_dir}" || Err_Impossible
  elif [ ! -O "${trash_dir}" ]; then
    chmod -R u=rwX,g=rwX,o=rwX "${trash_dir}" || Err_Impossible
  fi
  for trash in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
    # An unmatched glob stays literal; there is nothing to move in that case.
    if [ ! -e "${trash}" ] && [ ! -L "${trash}" ]; then
      continue
    fi
    if [ -d "${trash}" ] || [ -n "$(Is_NotMD5 "${trash}")" ] || [ -z "$(grep "$(get_basename "${trash}")" "${TEMP_PREFIX}-list")" ]; then
      has_trash=1
      mv -f -- "${trash}" "${trash_dir}" || Err_Impossible
      trashes="${trashes}
$(get_basename "${trash}")"
    fi
    Progress_Anim
  done
  # Best effort: succeeds only when nothing was moved; failure is expected
  # (and silenced) when the trash directory is in use.
  rmdir "${trash_dir}" 2>/dev/null
  Progress_Done
  if [ -n "${has_trash}" ]; then
    echo "${trashes}"
  fi
}
efd957294c8c
refactoring. cleanup. etc.
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
186
diff
changeset
|
205 |
# Verify the local repository and work out which files still need fetching.
#
# When ISNEW is empty (existing repository, full check):
#   1. Unless NOCLEAN is set, Cleanup_Repository is run first.
#   2. Every entry in ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR} is classified:
#        - directory or non-MD5 name -> reported as "not checked"
#        - MD5 of content equals its name -> recorded in ${TEMP_PREFIX}-ok
#        - otherwise -> deleted and recorded in ${TEMP_PREFIX}-error
#   3. ${TEMP_PREFIX}-newlist becomes ${TEMP_PREFIX}-list minus every line
#      matching a verified file name. It is seeded from the full list first,
#      so it is correct even when no local file verified.
# When ISNEW is set (empty repository or quick mode) the whole list is
# copied to ${TEMP_PREFIX}-newlist without any checking.
#
# Globals read:    ISNEW, ISQUICK, NOCLEAN, BASE_DIR, SITE_DIR, TARGET_DIR,
#                  TEMP_PREFIX
# Globals written: files_error, files_notdanbooru, has_err_filename,
#                  has_err_md5, file, is_ok
Check_Files() {
  if [ ! -n "${ISNEW}" ]; then
    [ -z "${NOCLEAN}" ] && Cleanup_Repository
    printf "Checking for errors... "
    Progress_Init
    files_error="These files do not match its md5:"
    files_notdanbooru="These files are not checked:"
    has_err_filename=
    has_err_md5=
    : > "${TEMP_PREFIX}-error"
    : > "${TEMP_PREFIX}-ok"
    for file in "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/"*; do
      # The literal pattern means the glob matched nothing.
      if [ "${file}" != "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}/*" ]; then
        if [ -n "$(Is_NotMD5 "${file}")" ] || [ -d "${file}" ]; then
          files_notdanbooru="${files_notdanbooru}
$(get_basename "${file}")"
          has_err_filename=1
        elif [ "$(get_md5 "${file}")" = "$(get_filename "${file}")" ]; then
          get_basename "${file}" >> "${TEMP_PREFIX}-ok"
        else
          rm -- "${file}" || Err_Fatal "Error removing ${file}"
          get_basename "${file}" >> "${TEMP_PREFIX}-error"
          files_error="${files_error}
$(get_basename "${file}")"
          has_err_md5=1
        fi
      fi
      Progress_Anim
    done
    Progress_Done
    if [ ! -n "${has_err_md5}" ] && [ ! -n "${has_err_filename}" ]; then
      echo "All files OK"
    else
      if [ -n "${has_err_md5}" ]; then
        echo "${files_error}"
        echo "$(( $(wc -l < "${TEMP_PREFIX}-error") )) file(s) removed"
      fi
      [ -n "${has_err_filename}" ] && echo "${files_notdanbooru}"
    fi
    echo "$(( $(wc -l < "${TEMP_PREFIX}-ok") )) file(s) available locally"

    printf "Generating list of new files... "
    Progress_Init
    cp -f "${TEMP_PREFIX}-list" "${TEMP_PREFIX}-templist" || Err_Impossible
    # Seed the result: with an empty -ok file the loop below never runs and
    # everything on the server list still has to be downloaded.
    cp -f "${TEMP_PREFIX}-list" "${TEMP_PREFIX}-newlist" || Err_Impossible
    # One grep per verified file (instead of grep -f) is kept on purpose.
    while IFS= read -r is_ok; do
      grep -v "${is_ok}" "${TEMP_PREFIX}-templist" > "${TEMP_PREFIX}-newlist"
      cp -f "${TEMP_PREFIX}-newlist" "${TEMP_PREFIX}-templist" || Err_Impossible
      Progress_Anim
    done < "${TEMP_PREFIX}-ok"
    Progress_Done
    echo "$(( $(wc -l < "${TEMP_PREFIX}-newlist") )) file(s) to be downloaded"
  else
    if [ -n "${ISQUICK}" ]; then
      echo "Quick mode selected. Skipping check"
    else
      echo "Empty local repository"
    fi
    cat "${TEMP_PREFIX}-list" > "${TEMP_PREFIX}-newlist"
  fi
}
270 | |
# Download every URL listed in ${TEMP_PREFIX}-newlist into
# ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}.
# wget is started in the background (-b) with resuming enabled and logs to
# ${TEMP_PREFIX}.log. Nothing is started when the list is empty.
# The change of directory is checked: wget writes into the current
# directory, so a failed cd must stop the run instead of downloading there.
# Globals read: TEMP_PREFIX, BASE_DIR, SITE_DIR, TARGET_DIR
Fetch_Images() {
  if [ "$(( $(wc -l < "${TEMP_PREFIX}-newlist") ))" -eq 0 ]; then
    echo "No new file"
  else
    printf "Starting wget... "
    cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" \
      || Err_Fatal "Cannot enter ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
    wget -e continue=on -bi "${TEMP_PREFIX}-newlist" -o "${TEMP_PREFIX}.log"
  fi
}
281 | |
# Parse the command line and initialise the global state.
#
# Usage: Init COMMAND [-n] [-p PASSWORD] [-s SITE] [-u USER] [--] TAGS...
#   COMMAND  one of check, fetch, quickfetch (stored in JOB)
#   -s SITE  site to use instead of ${DEFAULT_SITE}
#   -n       sets NOCLEAN=1
#   -u USER  stored in LOGIN_USER
#   -p PASS  stored in LOGIN_PASS as the SHA-1 hex digest of PASS
#   TAGS     remaining arguments, joined with spaces
# Any other option, fewer than two arguments or an unknown COMMAND ends in
# Err_Help; a missing tag ends in Err_Fatal.
#
# Globals read:    ADDITIONAL_PATH, DEFAULT_SITE, BASE_DIR, PWD, HOME
# Globals written: PATH, ISQUICK, ISNEW, JOB, SITE, TAGS, NOCLEAN,
#                  LOGIN_USER, LOGIN_PASS, BASE_DIR, TARGET_DIR, SITE_DIR,
#                  TEMP_PREFIX
# NOTE(review): the password is passed on the command line and is therefore
# visible in the process list.
Init(){
  # path initialization
  [ -n "${ADDITIONAL_PATH}" ] && PATH="${ADDITIONAL_PATH}:${PATH}"
  export PATH

  # misc variables
  ISQUICK=
  ISNEW=

  [ $# -lt 2 ] && Err_Help
  case "$1" in
    check|fetch|quickfetch)
      echo "Starting..."
      JOB="$1"
      ;;
    *)
      Err_Help
      ;;
  esac
  shift
  SITE=
  TAGS=
  OPTIND=1
  # The "(name)" parts of the option string are kept from the original;
  # presumably long-option aliases for shells whose getopts supports that
  # syntax - TODO confirm. Other shells read those characters as extra
  # option letters, which the default arm below rejects.
  while getopts "s:(site)n(noclean)u:(user)p:(password)" opt; do
    case "$opt" in
      s) SITE="$OPTARG" ;;
      n) NOCLEAN=1 ;;
      p)
        LOGIN_PASS=$(printf "%s" "$OPTARG" | openssl dgst -sha1)
        # Drop the "(stdin)= "-style label some OpenSSL releases print.
        LOGIN_PASS=${LOGIN_PASS##*= }
        ;;
      u) LOGIN_USER="$OPTARG" ;;
      *) Err_Help ;;
    esac
  done
  # OPTIND is read after the loop so a "--" terminator is consumed as well.
  shift $((OPTIND - 1))
  TAGS="$*"
  [ -n "${SITE}" ] || SITE=${DEFAULT_SITE}
  [ -n "${TAGS}" ] || Err_Fatal "No tag specified"
  # Get base folder - default, current folder or fallback to ${HOME}
  [ -n "${BASE_DIR}" ] || BASE_DIR=${PWD}
  [ -n "${BASE_DIR}" ] || BASE_DIR=${HOME}
  # Force an absolute path.
  case "${BASE_DIR}" in
    /*) ;;
    *) BASE_DIR="/${BASE_DIR}" ;;
  esac

  echo "Tags: ${TAGS}"
  # slash is not wanted for folder name
  TARGET_DIR=$(printf '%s\n' "${TAGS}" | sed -e 's/\//_/g')
  SITE_DIR=$(printf '%s\n' "${SITE}" | sed -e 's/\/$//g;s/\//_/g')
  TEMP_PREFIX="${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}"
}
148 | 331 |
181
d3b7927bdb2b
restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents:
180
diff
changeset
|
# Start-up: banner, argument parsing, tool and folder checks.
Msg_Welcome
Init "$@"
Check_Tools
Check_Folders

# Run the requested job.
# quickfetch behaves like fetch on a repository that is treated as new,
# which makes Check_Files skip the local verification.
if [ "${JOB}" = "quickfetch" ]; then
  ISNEW=1
  ISQUICK=1
fi

# Every job builds the server list and the list of new files ...
case "${JOB}" in
  check|fetch|quickfetch)
    Generate_Link
    Check_Files
    ;;
esac

# ... and only the fetching jobs download afterwards.
case "${JOB}" in
  fetch|quickfetch)
    Fetch_Images
    ;;
esac