annotate moefetch.sh @ 181:d3b7927bdb2b

restructuring and add check if the xml is processed properly
author edhoprima@gmail.com <edhoprima@gmail.com>
date Sun, 28 Jun 2009 05:12:41 +0000
parents 8e6555aa8631
children d92dfe857047
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
148
edhoprima
parents:
diff changeset
1 #!/bin/sh
edhoprima
parents:
diff changeset
2
edhoprima
parents:
diff changeset
3 # Copyright (c) 2009, edogawaconan <me@myconan.net>
edhoprima
parents:
diff changeset
4 #
edhoprima
parents:
diff changeset
5 # Permission to use, copy, modify, and/or distribute this software for any
edhoprima
parents:
diff changeset
6 # purpose with or without fee is hereby granted, provided that the above
edhoprima
parents:
diff changeset
7 # copyright notice and this permission notice appear in all copies.
edhoprima
parents:
diff changeset
8 #
edhoprima
parents:
diff changeset
9 # THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
edhoprima
parents:
diff changeset
10 # WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
edhoprima
parents:
diff changeset
11 # MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
edhoprima
parents:
diff changeset
12 # ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
edhoprima
parents:
diff changeset
13 # WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
edhoprima
parents:
diff changeset
14 # ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
edhoprima
parents:
diff changeset
15 # OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
16 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
17 # Lots of bugs here. Use with care
148
edhoprima
parents:
diff changeset
18 # USE WITH CARE
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
19 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
20 # what it does: fetch every picture that has the specified TAGS.
148
edhoprima
parents:
diff changeset
21 # requirement: wget, libxslt, md5sum (or md5)
edhoprima
parents:
diff changeset
22
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
23 # program additional paths for: cut, sed, wc, MD5(sum), wget, xsltproc, grep
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
24 ADDITIONAL_PATH=
148
edhoprima
parents:
diff changeset
25
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
26 # custom md5 path with arguments, expected output: <32digit md5><space(s)><filename>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
27 # Leave empty for "md5sum" (Linux, Solaris), "md5 -r" (*BSD)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
28 MD5=
148
edhoprima
parents:
diff changeset
29
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
30 # default server address. Danbooru only! I do not take responsibility of stupidity.
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
31 DEFAULT_SITE="moe.imouto.org"
148
edhoprima
parents:
diff changeset
32
edhoprima
parents:
diff changeset
33 # base directory. make sure it's writeable. I do not take responsibility if you don't own the folder and files as no check is done for this one.
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
34 # Structure is ${BASE_DIR}/<TAGS>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
35 # Absolute path only.
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
36 # Leave empty to use whatever folder you're running this at
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
37 BASE_DIR=""
148
edhoprima
parents:
diff changeset
38
edhoprima
parents:
diff changeset
39 # not user modifiable from here
edhoprima
parents:
diff changeset
40
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
41 # useless welcome message. Also version
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
42 Msg_Welcome() {
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
43 MOEFETCHVERSION="0.1-beta2"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
44 cat <<EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
45 moefetch ${MOEFETCHVERSION}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
46 Copyright (c) 2009 edogawaconan <me@myconan.net>
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
47
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
48 EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
49 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
50
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
51 # fatal error handler
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
52 Err_Fatal() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
53 echo "Fatal error: ${1}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
54 exit 1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
55 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
56
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
57 # help message
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
58 Err_Help() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
59 cat <<EOF
177
4d7de9c3b98c whoops typo
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 176
diff changeset
60 moefetch.sh COMMAND [-s SITE_URL] TAGS
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
61
176
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
62 COMMAND:
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
63 (quick)fetch: do a complete update. Add prefix quick to skip file checking
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
64 check: get list of new files, clean up local folder and print total new files
175
5b7a154dbd21 cosmetics fix for help message
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 174
diff changeset
65
177
4d7de9c3b98c whoops typo
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 176
diff changeset
66 -s SITE_URL: Specify URL of the Danbooru powered site you want to leech from. Default is ${DEFAULT_SITE}
175
5b7a154dbd21 cosmetics fix for help message
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 174
diff changeset
67
176
3d2ae9417273 even more improvement
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 175
diff changeset
68 TAGS: Tags you want to download. Separated by spaces. Tag name follows standard Danbooru tagging scheme
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
69
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
70 EOF
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
71 exit 0
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
72 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
73
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
74 # generate link by transforming xml
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
75 Generate_Link() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
76 cd "${BASE_DIR}/temp"
148
edhoprima
parents:
diff changeset
77 echo
edhoprima
parents:
diff changeset
78 echo "Fetching xml file"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
79 wget "http://${SITE}/post/index.xml?tags=${TAGS}&offset=0&limit=100000" -O "${SITE_DIR}-${TARGET_DIR}-xml" -e continue=off
148
edhoprima
parents:
diff changeset
80 echo "Processing XML file..."
edhoprima
parents:
diff changeset
81 # xslt evilry
165
9495944e326b damn dollar
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 164
diff changeset
82 xsltproc - "${SITE_DIR}-${TARGET_DIR}-xml" <<EOF | sed 's/.*\(http.*\)\(\/[a-f0-9]\{32\}\).*\.\([jp][pn]g\)/\1\2.\3/g' | grep ^http > "${SITE_DIR}-${TARGET_DIR}-list"
148
edhoprima
parents:
diff changeset
83 <xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
edhoprima
parents:
diff changeset
84 <xsl:output method="xml" indent="yes"/>
edhoprima
parents:
diff changeset
85 <xsl:template match="post">
edhoprima
parents:
diff changeset
86 <xsl:value-of select="@file_url" />
edhoprima
parents:
diff changeset
87 </xsl:template>
edhoprima
parents:
diff changeset
88 </xsl:stylesheet>
edhoprima
parents:
diff changeset
89 EOF
181
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
90 NUMFILES=`echo \`wc -l < \"${SITE_DIR}-${TARGET_DIR}-list\" \``
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
91 [ "${NUMFILES}" -gt 0 ] || Err_Fatal "Error in processing list or no files can be found with specified tag(s) or site"
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
92 echo "${NUMFILES}" file(s) available on server"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
93 #output file: ${TARGET_DIR}-list
148
edhoprima
parents:
diff changeset
94 }
edhoprima
parents:
diff changeset
95
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
96 # check tools availability
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
97 Check_Tools() {
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
98 # verify all programs required do indeed exist
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
99 #MD5
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
100 if [ ! "${MD5}" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
101 case `uname` in
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
102 *BSD) MD5="md5 -r";;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
103 Linux|SunOS) MD5="md5sum";;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
104 *) Fatal_Err "No known md5 tool for this platform. Please specify manually"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
105 esac
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
106 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
107 MD5_COMMAND=`echo ${MD5} | cut -d' ' -f1`
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
108 # basic tools
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
109 COMMANDS="cut sed wc wget xsltproc xargs rm mkdir chown comm grep ${MD5_COMMAND}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
110 for COMMAND in ${COMMANDS}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
111 do
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
112 COMMAND_CHECK=`command -v "${COMMAND}"`
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
113 [ "${COMMAND_CHECK}" ] || Err_Fatal "${COMMAND} doesn't exist in ${PATH}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
114 done
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
115
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
116 # grep checking
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
117 # originally created for workaround on solaris
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
118 #if [ `uname` = "SunOS" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
119 FAIL=""
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
120 echo "blah" > superrandomtestfile
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
121 echo "blah" > superrandomtestfile.2
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
122 grep -f superrandomtestfile.2 superrandomtestfile > /dev/null 2>&1 || FAIL=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
123 rm -f superrandomtestfile superrandomtestfile.2
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
124 [ "${FAIL}" ] && Err_Fatal "Your grep is not compatible. Please install or set path of correct grep"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
125 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
126
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
127 # verify required folders exist and writeable
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
128 Check_Folders(){
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
129 [ -O "${BASE_DIR}" ] || Err_Fatal "You don't own ${BASE_DIR}. Please fix ${BASE_DIR}."
180
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 179
diff changeset
130 for FOLDER in temp trash deleted "${SITE_DIR}/${TARGET_DIR}"; do
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
131 if [ ! -d "${BASE_DIR}/${FOLDER}" ]; then
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
132 mkdir "${BASE_DIR}/${FOLDER}" || Err_Fatal "${FOLDER} folder creation failed"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
133 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
134 if [ ! -O "${BASE_DIR}/${FOLDER}" ]; then
167
78ac6fd03e3a more fix
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 166
diff changeset
135 echo "You don't own the ${BASE_DIR}/${FOLDER}, applying globally writeable permission on it"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
136 chmod -R u=rwX,g=rwX,o=rwX "${BASE_DIR}/${FOLDER}" || Err_Fatal "Error changing ownership. This shouldn't happen"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
137 fi
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
138 done
167
78ac6fd03e3a more fix
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 166
diff changeset
139 [ `echo \`ls "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" | wc -l\`` -eq 0 ] && ISNEW=1
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
140 # let's move to workdir
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
141 cd "${BASE_DIR}/temp"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
142 for i in error ok list newlist; do
161
52877e2849bb misc fix. These past commits wasn't actually tested
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 160
diff changeset
143 touch "${SITE_DIR}-${TARGET_DIR}-${i}" || Fatal_Err "Error creating ${TARGET_DIR}-${i}. This shouldn't happen"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
144 done
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
145 #
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
146 }
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
147
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
148 # check files correctness
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
149 Check_Files() {
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
150 if [ ! "${ISNEW}" ]; then
148
edhoprima
parents:
diff changeset
151 echo "Checking for errors..."
edhoprima
parents:
diff changeset
152 # THE FILES
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
153
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
154 # current dir: ${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
155 cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
173
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
156 TRASH_DIR="${SITE_DIR}-${TARGET_DIR}-`date -u +%Y%m%d-%H.%M`"
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
157 mkdir -p "${BASE_DIR}/trash/${TRASH_DIR}"
179
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
158 # FIXME FIXME FIXME FIXME FIXME FIXME
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
159 for TRASH in *
148
edhoprima
parents:
diff changeset
160 do
179
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
161 if [ -d "${TRASH}" ]; then
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
162 mv -f "${TRASH}" "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Error deleting files"
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
163 echo "Moved ${TRASH} to ${BASE_DIR}/trash/${TRASH_DIR}"
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
164 else
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
165 TRASH="`echo ${TRASH} | sed -e 's/\([0-9a-f]\{32\}.*\)//g' | grep -v ^$`"
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
166 if [ "${TRASH}" ]; then
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
167 mv -f "${TRASH}" "${BASE_DIR}/trash/${TRASH_DIR}" || Err_Fatal "Error deleting files"
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
168 echo "Moved ${TRASH} to ${BASE_DIR}/trash/${TRASH_DIR}"
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
169 fi
c132eb3ca841 improved folder checker
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 178
diff changeset
170 fi
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
171 done
173
2b7c8c1ecdfe better trash handler
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 172
diff changeset
172 [ "`ls "${BASE_DIR}/trash/${TRASH_DIR}"`" ] || rmdir "${BASE_DIR}/trash/${TRASH_DIR}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
173 printf "" > "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
174 for FILE in *
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
175 do
170
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
176 if [ "`${MD5} "${FILE}" | cut -d ' ' -f1 -`" != "`echo "${FILE}" | cut -d '.' -f1`" ]
148
edhoprima
parents:
diff changeset
177 then
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
178 echo
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
179 echo "${FILE}" >> "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
180 echo "Error: ${FILE}"
148
edhoprima
parents:
diff changeset
181 fi
edhoprima
parents:
diff changeset
182 printf "."
edhoprima
parents:
diff changeset
183 done
edhoprima
parents:
diff changeset
184 echo
178
3f5ee8b2791f error when restructuring
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 177
diff changeset
185 TOTAL_ERROR=`echo \`wc -l < "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error"\``
3f5ee8b2791f error when restructuring
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 177
diff changeset
186 echo "${TOTAL_ERROR} file(s) error"
170
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
187 echo "Removing error files"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
188 if [ "${TOTAL_ERROR}" -eq 0 ]; then
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
189 echo "No error file. 0 file removed"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
190 else
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
191 cat "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-error" | xargs rm
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
192 echo "${TOTAL_ERROR} file(s) removed"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
193 fi
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
194 echo "`echo \`ls | wc -l\`` file(s) available locally"
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 169
diff changeset
195
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
196 # current dir: ${BASE_DIR}/temp
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
197 cd ${BASE_DIR}/temp
148
edhoprima
parents:
diff changeset
198
edhoprima
parents:
diff changeset
199 echo "Generating list of new files..."
edhoprima
parents:
diff changeset
200 # THE FILES
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
201 #ls "../${TARGET_DIR}" | grep -vf "${TARGET_DIR}-error" > "${TARGET_DIR}-ok"
156
d3b002fd944e fix: my attempt at speeding up things failed. reverting back to trusty grep -vf
edhoprima
parents: 155
diff changeset
202 #
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
203 ls "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}" | comm -1 -3 "${SITE_DIR}-${TARGET_DIR}-error" - > "${SITE_DIR}-${TARGET_DIR}-ok"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
204 cat "${SITE_DIR}-${TARGET_DIR}-list" | grep -vf "${SITE_DIR}-${TARGET_DIR}-ok" > "${SITE_DIR}-${TARGET_DIR}-newlist"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
205 echo "`echo \`wc -l < \"${SITE_DIR}-${TARGET_DIR}-newlist\"\`` file(s) to be downloaded"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
206
148
edhoprima
parents:
diff changeset
207 else
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
208 if [ "${ISQUICK}" ]; then
152
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
209 echo "quick mode selected. Skipping check"
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
210 else
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
211 echo "Empty local repository"
67df02877319 added quickfetch for skipping file checking
edhoprima
parents: 151
diff changeset
212 fi
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
213 cd "${BASE_DIR}/temp"
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
214 cat "${SITE_DIR}-${TARGET_DIR}-list" > "${SITE_DIR}-${TARGET_DIR}-newlist"
148
edhoprima
parents:
diff changeset
215 fi
edhoprima
parents:
diff changeset
216 }
edhoprima
parents:
diff changeset
217
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
218 # start downloading the images
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
219 Fetch_Images() {
160
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
220 cd "${BASE_DIR}/temp"
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
221 if [ `echo \`wc -l < "${SITE_DIR}-${TARGET_DIR}-newlist"\`` -eq 0 ]; then
148
edhoprima
parents:
diff changeset
222 echo "No new file"
edhoprima
parents:
diff changeset
223 else
edhoprima
parents:
diff changeset
224 echo "Starting wget"
160
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
225 cd "${BASE_DIR}/${SITE_DIR}/${TARGET_DIR}"
68227a30d0b3 forgot to fix Fetch_Images to reflect new folder naming scheme
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 159
diff changeset
226 wget -e continue=on -bi "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}-newlist" -o "${BASE_DIR}/temp/${SITE_DIR}-${TARGET_DIR}.log"
148
edhoprima
parents:
diff changeset
227 fi
edhoprima
parents:
diff changeset
228 }
edhoprima
parents:
diff changeset
229
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
230 # initialize base variables and initial command check
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
231 Init(){
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
232 # path initialization
181
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
233 [ "${ADDITIONAL_PATH}" ] && PATH="${ADDITIONAL_PATH}:${PATH}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
234 export PATH
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
235
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
236 # misc variables
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
237 ISQUICK=
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
238 ISNEW=
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
239
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
240 [ $# -lt 2 ] && Err_Help
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
241 case "$1" in
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
242 check|fetch|quickfetch)
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
243 echo "Starting..."
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
244 JOB="$1"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
245 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
246 *)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
247 Err_Help
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
248 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
249 esac
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
250 shift
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
251 SITE=
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
252 case "$1" in
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
253 -s|--site)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
254 shift
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
255 SITE="$1"
163
e2149ba6ab9c shift placed at wrong place.
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 162
diff changeset
256 shift
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
257 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
258 *)
161
52877e2849bb misc fix. These past commits wasn't actually tested
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 160
diff changeset
259 SITE="${DEFAULT_SITE}"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
260 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
261 esac
181
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
262 # Get base folder - default, current folder or fallback to ${HOME}
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
263 [ "${BASE_DIR}" ] || BASE_DIR="${PWD}"
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
264 [ "${BASE_DIR}" ] || BASE_DIR="{$HOME}"
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
265 [ "`echo ${BASE_DIR} | cut -c1 | grep \/`" ] || BASE_DIR="/${BASE_DIR}"
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
266
166
cc60e8cf7793 dunno :<
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 165
diff changeset
267 TAGS="$@"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
268 echo "Tags: ${TAGS}"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
269 # slash is not wanted for folder name
162
1f937c2e8b3f tags doesn't get parsed :(
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 161
diff changeset
270 TARGET_DIR="`echo "${TAGS}" | sed -e 's/\//_/g'`"
1f937c2e8b3f tags doesn't get parsed :(
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 161
diff changeset
271 SITE_DIR="`echo "${SITE}" | sed -e 's/\/$//g;s/\//_/g'`"
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
272 }
148
edhoprima
parents:
diff changeset
273
181
d3b7927bdb2b restructuring and add check if the xml is processed properly
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 180
diff changeset
274 # initialization
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
275 Msg_Welcome
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
276 Init "$@"
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
277 Check_Tools
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
278 Check_Folders
158
cba73f6a96bb grep check. OpenSolaris' default grep doesn't support -f
edhoprima
parents: 157
diff changeset
279
148
edhoprima
parents:
diff changeset
280
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
281 # let's do the job!
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
282 case "${JOB}" in
174
0948e76a57a1 added help. Bump to 0.1-beta2
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 173
diff changeset
283 check)
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
284 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
285 Check_Files
148
edhoprima
parents:
diff changeset
286 ;;
159
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
287 fetch)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
288 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
289 Check_Files
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
290 Fetch_Images
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
291 ;;
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
292 quickfetch)
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
293 ISNEW=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
294 ISQUICK=1
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
295 Generate_Link
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
296 Check_Files
75fe19903b74 Major cleanup
edhoprima@gmail.com <edhoprima@gmail.com>
parents: 158
diff changeset
297 Fetch_Images
148
edhoprima
parents:
diff changeset
298 ;;
edhoprima
parents:
diff changeset
299 esac