annotate moefetch.sh @ 178:3f5ee8b2791f

error when restructuring
author edhoprima@gmail.com <edhoprima@gmail.com>
date Fri, 05 Jun 2009 20:41:40 +0000
parents 4d7de9c3b98c
children c132eb3ca841
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
148
edhoprima
parents:
diff changeset
1 #!/bin/sh
edhoprima
parents:
diff changeset
2
edhoprima
parents:
diff changeset
3 # Copyright (c) 2009, edogawaconan <me@myconan.net>
edhoprima
parents:
diff changeset
4 #
edhoprima
parents:
diff changeset
5 # Permission to use, copy, modify, and/or distribute this software for any
edhoprima
parents:
diff changeset
6 # purpose with or without fee is hereby granted, provided that the above
edhoprima
parents:
diff changeset
7 # copyright notice and this permission notice appear in all copies.
edhoprima
parents:
diff changeset
8 #
edhoprima
parents:
diff changeset
9 # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
edhoprima
parents:
diff changeset
10 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
edhoprima
parents:
diff changeset
11 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
edhoprima
parents:
diff changeset
12 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
edhoprima
parents:
diff changeset
13 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
edhoprima
parents:
diff changeset
14 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
edhoprima
parents:
diff changeset
15 # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
16 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
17 # Lots of bugs here. Use with care
148
edhoprima
parents:
diff changeset
18 # USE WITH CARE
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
19 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
20 # what it does: fetch every picture that has the specified TAGS.
148
edhoprima
parents:
diff changeset
21 # requirement: wget, libxslt, md5sum (or md5)
edhoprima
parents:
diff changeset
22
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
23 # program additional paths for: cut, sed, wc, MD5(sum), wget, xsltproc, grep
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
24 ADDITIONAL_PATH=
148
edhoprima
parents:
diff changeset
25
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
26 # custom md5 path with arguments, expected output: <32digit md5><space(s)><filename>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
27 # Leave empty for "md5sum" (Linux, Solaris), "md5 -r" (*BSD)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
28 MD5=
148
edhoprima
parents:
diff changeset
29
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
30 # default server address. Danbooru only! I do not take responsibility of stupidity.
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
31 DEFAULT_SITE="moe.imouto.org"
148
edhoprima
parents:
diff changeset
32
edhoprima
parents:
diff changeset
33 # base directory. make sure it's writeable. I do not take responsibility if you don't own the folder and files as no check is done for this one.
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
34 # Structure is ${BASE_DIR}/<TAGS>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
35 # Absolute path only.
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
36 # Leave empty to use whatever folder you're running this at
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
37 BASE_DIR=""
148
edhoprima
parents:
diff changeset
38
edhoprima
parents:
diff changeset
39 # not user modifiable from here
edhoprima
parents:
diff changeset
40
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
41 # useless welcome message. Also version
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
42 Msg_Welcome() {
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
43 MOEFETCHVERSION="0.1-beta2"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
44 cat <<EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
45 moefetch ${MOEFETCHVERSION}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
46 Copyright (c) 2009 edogawaconan <me@myconan.net>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
47
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
48 EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
49 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
50
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
51 # fatal error handler
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
52 Err_Fatal() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
53 echo "Fatal error: ${1}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
54 exit 1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
55 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
56
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
57 # help message
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
58 Err_Help() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
59 cat <<EOF
177
4d7de9c3b98c whoops typo
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 176
diff changeset
60 moefetch.sh COMMAND [-s SITE_URL] TAGS
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
61
176
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
62 COMMAND:
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
63 (quick)fetch: do a complete update. Add prefix quick to skip file checking
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
64 check: get list of new files, clean up local folder and print total new files
175
5b7a154dbd21 cosmetics fix for help message
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 174
diff changeset
65
177
4d7de9c3b98c whoops typo
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 176
diff changeset
66 -s SITE_URL: Specify URL of the Danbooru powered site you want to leech from. Default is ${DEFAULT_SITE}
175
5b7a154dbd21 cosmetics fix for help message
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 174
diff changeset
67
176
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
68 TAGS: Tags you want to download. Separated by spaces. Tag name follows standard Danbooru tagging scheme
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
69
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
70 EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
71 exit 0
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
72 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
73
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
74 # generate link by transforming xml
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
75 Generate_Link() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
76 cd "${BASE_DIR}/temp"
148
edhoprima
parents:
diff changeset
77 echo
edhoprima
parents:
diff changeset
78 echo "Fetching xml file"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
79 wget "http://${SITE}/post/index.xml?tags=${TAGS}&offset=0&limit=100000" -O "${SITE_DIR}-${TARGET_DIR}-xml" -e continue=off
148
edhoprima
parents:
diff changeset
80 echo "Processing XML file..."
edhoprima
parents:
diff changeset
81 # xslt evilry
165
9495944e326b damn dollar
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 164
diff changeset
82 xsltproc - "${SITE_DIR}-${TARGET_DIR}-xml" <<EOF | sed 's/.*\(http.*\)\(\/[a-f0-9]\{32\}\).*\.\([jp][pn]g\)/\1\2.\3/g' | grep ^http > "${SITE_DIR}-${TARGET_DIR}-list"
148
edhoprima
parents:
diff changeset
83 <xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
edhoprima
parents:
diff changeset
84 <xsl:output method="xml" indent="yes"/>
edhoprima
parents:
diff changeset
85 <xsl:template match="post">
edhoprima
parents:
diff changeset
86 <xsl:value-of select="@file_url" />
edhoprima
parents:
diff changeset
87 </xsl:template>
edhoprima
parents:
diff changeset
88 </xsl:stylesheet>
edhoprima
parents:
diff changeset
89 EOF
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
90 echo "`echo \`wc -l < \"${SITE_DIR}-${TARGET_DIR}-list\" \`` file(s) available on server"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
91 #output file: ${TARGET_DIR}-list
148
edhoprima
parents:
diff changeset
92 }
edhoprima
parents:
diff changeset
93
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
94 # check tools availability
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
95 Check_Tools() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
96 # verify all programs required do indeed exist
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
97 #MD5
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
98 if [ ! "${MD5}" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
99 case `uname` in
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
100 *BSD) MD5="md5 -r";;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
101 Linux|SunOS) MD5="md5sum";;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
102 *) Fatal_Err "No known md5 tool for this platform. Please specify manually"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
103 esac
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
104 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
105 MD5_COMMAND=`echo ${MD5} | cut -d' ' -f1`
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
106 # basic tools
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
107 COMMANDS="cut sed wc wget xsltproc xargs rm mkdir chown comm grep ${MD5_COMMAND}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
108 for COMMAND in ${COMMANDS}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
109 do
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
110 COMMAND_CHECK=`command -v "${COMMAND}"`
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
111 [ "${COMMAND_CHECK}" ] || Err_Fatal "${COMMAND} doesn't exist in ${PATH}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
112 done
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
113
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
114 # grep checking
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
115 # originally created for workaround on solaris
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
116 #if [ `uname` = "SunOS" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
117 FAIL=""
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
118 echo "blah" > superrandomtestfile
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
119 echo "blah" > superrandomtestfile.2
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
120 grep -f superrandomtestfile.2 superrandomtestfile > /dev/null 2>&1 || FAIL=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
121 rm -f superrandomtestfile superrandomtestfile.2
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
122 [ "${FAIL}" ] && Err_Fatal "Your grep is not compatible. Please install or set path of correct grep"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
123 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
124
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
125 # verify required folders exist and writeable
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
126 Check_Folders(){
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
127 [ -O "${BASE_DIR}" ] || Err_Fatal "You don't own ${BASE_DIR}. Please fix ${BASE_DIR}."
167
78ac6fd03e3a more fix
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 166
diff changeset
128 for FOLDER in temp trash deleted ${SITE_DIR}/${TARGET_DIR}
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
129 do
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
130 if [ ! -d "${BASE_DIR}/${FOLDER}" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
131 mkdir "${BASE_DIR}/${FOLDER}" || Err_Fatal "${FOLDER} folder creation failed"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
132 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
133 if [ ! -O "${BASE_DIR}/${FOLDER}" ]; then
167
78ac6fd03e3a more fix
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 166
diff changeset
134 echo "You don't own the ${BASE_DIR}/${FOLDER}, applying globally writeable permission on it"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
135 chmod -R u=rwX,g=rwX,o=rwX "${BASE_DIR}/${FOLDER}" || Err_Fatal "Error changing ownership. This shouldn't happen"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
136 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
137 done
167
78ac6fd03e3a more fix
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 166
diff changeset
138 [ `echo \`ls "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" | wc -l\`` -eq 0 ] && ISNEW=1
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
139 # let's move to workdir
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
140 cd "${BASE_DIR}/temp"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
141 for i in error ok list newlist; do
161
52877e2849bb misc fix. These past commits wasn't actually tested
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 160
diff changeset
142 touch "${SITE_DIR}-${TARGET_DIR}-${i}" || Fatal_Err "Error creating ${TARGET_DIR}-${i}. This shouldn't happen"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
143 done
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
144 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
145 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
146
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
147 # check files correctness
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
148 Check_Files() {
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
149 if [ ! "${ISNEW}" ]; then
148
edhoprima
parents:
diff changeset
150 echo "Checking for errors..."
edhoprima
parents:
diff changeset
151 # THE FILES
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
152
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
153 # current dir: ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
154 cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
173
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
155 TRASH_DIR="${SITE_DIR}-${TARGET_DIR}-`date -u +%Y%m%d-%H.%M`"
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
156 mkdir -p "${BASE_DIR}/trash/${TRASH_DIR}"
172
30de37b6fe47 lol wut
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 171
diff changeset
157 for TRASH in `ls | sed -e 's/\([0-9a-f]\{32\}.*\)//g' | grep -v ^$`
148
edhoprima
parents:
diff changeset
158 do
173
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
159 mv -f "${TRASH}" "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Error deleting files"
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
160 echo "Moved ${TRASH} to ${BASE_DIR}/trash/${TRASH_DIR}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
161 done
173
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
162 [ "`ls "${BASE_DIR}/trash/${TRASH_DIR}"`" ] || rmdir "${BASE_DIR}/trash/${TRASH_DIR}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
163 printf "" > "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
164 for FILE in *
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
165 do
170
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
166 if [ "`${MD5} "${FILE}" | cut -d ' ' -f1 -`" != "`echo "${FILE}" | cut -d '.' -f1`" ]
148
edhoprima
parents:
diff changeset
167 then
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
168 echo
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
169 echo "${FILE}" >> "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
170 echo "Error: ${FILE}"
148
edhoprima
parents:
diff changeset
171 fi
edhoprima
parents:
diff changeset
172 printf "."
edhoprima
parents:
diff changeset
173 done
edhoprima
parents:
diff changeset
174 echo
178
3f5ee8b2791f error when restructuring
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 177
diff changeset
175 TOTAL_ERROR=`echo \`wc -l < "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"\``
3f5ee8b2791f error when restructuring
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 177
diff changeset
176 echo "${TOTAL_ERROR} file(s) error"
170
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
177 echo "Removing error files"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
178 if [ "${TOTAL_ERROR}" -eq 0 ]; then
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
179 echo "No error file. 0 file removed"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
180 else
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
181 cat "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error" | xargs rm
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
182 echo "${TOTAL_ERROR} file(s) removed"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
183 fi
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
184 echo "`echo \`ls | wc -l\`` file(s) available locally"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
185
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
186 # current dir: ${BASE_DIR}/temp
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
187 cd ${BASE_DIR}/temp
148
edhoprima
parents:
diff changeset
188
edhoprima
parents:
diff changeset
189 echo "Generating list of new files..."
edhoprima
parents:
diff changeset
190 # THE FILES
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
191 #ls "../${TARGET_DIR}" | grep -vf "${TARGET_DIR}-error" > "${TARGET_DIR}-ok"
156
d3b002fd944e fix: my attempt at speeding up things failed. reverting back to trusty grep -vf
edhoprima
parents: 155
diff changeset
192 #
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
193 ls "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" | comm -1 -3 "${SITE_DIR}-${TARGET_DIR}-error" - > "${SITE_DIR}-${TARGET_DIR}-ok"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
194 cat "${SITE_DIR}-${TARGET_DIR}-list" | grep -vf "${SITE_DIR}-${TARGET_DIR}-ok" > "${SITE_DIR}-${TARGET_DIR}-newlist"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
195 echo "`echo \`wc -l < \"${SITE_DIR}-${TARGET_DIR}-newlist\"\`` file(s) to be downloaded"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
196
148
edhoprima
parents:
diff changeset
197 else
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
198 if [ "${ISQUICK}" ]; then
152
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
199 echo "quick mode selected. Skipping check"
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
200 else
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
201 echo "Empty local repository"
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
202 fi
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
203 cd "${BASE_DIR}/temp"
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
204 cat "${SITE_DIR}-${TARGET_DIR}-list" > "${SITE_DIR}-${TARGET_DIR}-newlist"
148
edhoprima
parents:
diff changeset
205 fi
edhoprima
parents:
diff changeset
206 }
edhoprima
parents:
diff changeset
207
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
208 # start downloading the images
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
209 Fetch_Images() {
160
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
210 cd "${BASE_DIR}/temp"
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
211 if [ `echo \`wc -l < "${SITE_DIR}-${TARGET_DIR}-newlist"\`` -eq 0 ]; then
148
edhoprima
parents:
diff changeset
212 echo "No new file"
edhoprima
parents:
diff changeset
213 else
edhoprima
parents:
diff changeset
214 echo "Starting wget"
160
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
215 cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
216 wget -e continue=on -bi "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-newlist" -o "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}.log"
148
edhoprima
parents:
diff changeset
217 fi
edhoprima
parents:
diff changeset
218 }
edhoprima
parents:
diff changeset
219
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
220 # initialize base variables and initial command check
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
221 Init(){
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
222 # Get base folder - current folder or fallback to ${HOME}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
223 [ "${BASE_DIR}" ] || BASE_DIR="${PWD}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
224 [ "${BASE_DIR}" ] || BASE_DIR="{$HOME}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
225 [ "`echo ${BASE_DIR} | cut -c1 | grep \/`" ] || BASE_DIR="/${BASE_DIR}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
226 # path initialization
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
227 [ "${ADDITIONAL_PATH}" ] && PATH=${ADDITIONAL_PATH}:${PATH}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
228 export PATH
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
229
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
230 # misc variables
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
231 ISQUICK=
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
232 ISNEW=
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
233
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
234 [ $# -lt 2 ] && Err_Help
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
235 case "$1" in
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
236 check|fetch|quickfetch)
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
237 echo "Starting..."
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
238 JOB="$1"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
239 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
240 *)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
241 Err_Help
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
242 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
243 esac
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
244 shift
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
245 SITE=
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
246 case "$1" in
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
247 -s|--site)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
248 shift
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
249 SITE="$1"
163
e2149ba6ab9c shift placed at wrong place.
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 162
diff changeset
250 shift
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
251 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
252 *)
161
52877e2849bb misc fix. These past commits wasn't actually tested
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 160
diff changeset
253 SITE="${DEFAULT_SITE}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
254 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
255 esac
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
256 TAGS="$@"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
257 echo "Tags: ${TAGS}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
258 # slash is not wanted for folder name
162
1f937c2e8b3f tags doesn't get parsed :(
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 161
diff changeset
259 TARGET_DIR="`echo "${TAGS}" | sed -e 's/\//_/g'`"
1f937c2e8b3f tags doesn't get parsed :(
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 161
diff changeset
260 SITE_DIR="`echo "${SITE}" | sed -e 's/\/$//g;s/\//_/g'`"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
261 }
148
edhoprima
parents:
diff changeset
262
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
263 Msg_Welcome
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
264 Init "$@"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
265 Check_Tools
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
266 Check_Folders
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
267
148
edhoprima
parents:
diff changeset
268
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
269 # let's do the job!
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
270 case "${JOB}" in
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
271 check)
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
272 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
273 Check_Files
148
edhoprima
parents:
diff changeset
274 ;;
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
275 fetch)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
276 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
277 Check_Files
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
278 Fetch_Images
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
279 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
280 quickfetch)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
281 ISNEW=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
282 ISQUICK=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
283 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
284 Check_Files
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
285 Fetch_Images
148
edhoprima
parents:
diff changeset
286 ;;
edhoprima
parents:
diff changeset
287 esac