]>
Wikimedia Canada | Git repositories - eccc_to_commons.git/blob - mediawiki_post.sh
3 # mediawiki_post - Recursively send files in a directory to a Mediawiki instance
4 # Copyright (C) 2020 Pierre Choffet
6 # This program is free software: you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License as published by
8 # the Free Software Foundation, either version 3 of the License, or
9 # (at your option) any later version.
11 # This program is distributed in the hope that it will be useful,
12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 # GNU General Public License for more details.
16 # You should have received a copy of the GNU General Public License
17 # along with this program. If not, see <http://www.gnu.org/licenses/>.
22 ENDPOINT
='https://commons.wikimedia.org/w/api.php'
24 UPLOAD_MAX_RATE
=15 # Per minute
25 RESTART_AFTER_PATH
='' # i.e. weather.gc.ca/Monthly/1013241.tab
27 USERNAME_PATH
='login_username'
28 PASSWORD_PATH
='login_password'
29 LOGIN_TOKEN_PATH
='login_token'
30 CSRF_TOKEN_PATH
='csrf_token'
31 COOKIE_JAR
='cookie_jar'
36 LOGIN_TOKEN
=$(cat "${LOGIN_TOKEN_PATH}")
37 LOGIN_TOKEN
="${LOGIN_TOKEN/+/%2B}"
38 LOGIN_TOKEN
="${LOGIN_TOKEN/\\/%5C}"
42 CSRF_TOKEN
=$(cat "${CSRF_TOKEN_PATH}")
43 CSRF_TOKEN
="${CSRF_TOKEN/+/%2B}"
44 CSRF_TOKEN
="${CSRF_TOKEN/\\/%5C}"
48 local -r body
=$
(curl
-X POST
-d 'action=query' -d 'meta=tokens' -d 'type=login' \
49 -d 'format=xml' -b "${COOKIE_JAR}" -c "${COOKIE_JAR}" "${ENDPOINT}")
50 local -r login_token
="$(echo "${body}" | xmlstarlet sel -t -v //tokens/@logintoken -)"
55 local -r body
=$
(curl
-X POST
-d 'action=query' -d 'meta=tokens' \
56 -d 'format=xml' -b "${COOKIE_JAR}" -c "${COOKIE_JAR}" "${ENDPOINT}")
57 local -r csrf_token
="$(echo "${body}" | xmlstarlet sel -t -v //tokens/@csrftoken -)"
62 if [ ! -f "${LOGIN_TOKEN_PATH}" ]
64 requestLoginToken
> "${LOGIN_TOKEN_PATH}"
69 if [ ! -f "${USERNAME_PATH}" ]||[ ! -f "${PASSWORD_PATH}" ]
71 echo "What wiki account to use?"
72 read -p 'Username: ' USERNAME
73 read -sp 'Password: ' PASSWORD
75 USERNAME
="$(cat "${USERNAME_PATH}")"
76 PASSWORD
="$(cat "${PASSWORD_PATH}")"
79 local -r body
=$(curl -X POST -d 'action=login' --data-urlencode "lgname=${USERNAME}" --data-urlencode "lgpassword=${PASSWORD}" -d "lgtoken=${LOGIN_TOKEN}" -d 'format=xml' -b "${COOKIE_JAR}" -c "${COOKIE_JAR}" "${ENDPOINT}")
80 local -r result
=$(echo "${body}" | xmlstarlet sel -t -v '//login/@result' -)
84 requestLoginToken
> "${LOGIN_TOKEN_PATH}"
88 echo "${USERNAME}" > "${USERNAME_PATH}"
89 echo "${PASSWORD}" > "${PASSWORD_PATH}"
93 echo 'Login failed. Wrong credentials?'
97 echo "Unknown login result: ${result}. Exiting."
102 if [ -z "${SOURCE}" ]
104 echo 'Upload files to Mediawiki.'
105 echo 'Usage: mediawiki_post.sh <source folder>'
111 requestCSRFToken
> "${CSRF_TOKEN_PATH}"
114 # Prepare start offset
115 if [ "${RESTART_AFTER_PATH}" == '' ]
117 START_OFFSET_REACHED
=1
119 START_OFFSET_REACHED
=0
125 while IFS
= read -r -d '' -u 9
128 URI_PATH
=${NAMESPACE}:$(realpath --relative-to="${SOURCE}" "${REPLY}")
131 if [ ${START_OFFSET_REACHED} -eq 0 ]
133 if [ ${URI_PATH} == "${NAMESPACE}:${RESTART_AFTER_PATH}" ]
135 START_OFFSET_REACHED
=1
142 BODY
=$(curl -X POST -d 'action=edit' --data-urlencode "title=${URI_PATH}" --data-urlencode "text@${REPLY}" -d "token=${CSRF_TOKEN}" -d 'format=xml' -d 'bot=1' -b "${COOKIE_JAR}" -c "${COOKIE_JAR}" "${ENDPOINT}")
143 RESULT
=$(echo "${BODY}" | xmlstarlet sel -t -v '/api/edit/@result' -)
147 SECOND_NOW
=$(date +%S)
148 MINUTE_NOW
=$(date +%M)
149 MINUTE_UPLOADS
=$((MINUTE_UPLOADS+1))
151 if [ ${MINUTE_NOW} -ne ${MINUTE} ]
155 elif [ ${MINUTE_NOW} -eq ${MINUTE} ]&&[ ${MINUTE_UPLOADS} -eq ${UPLOAD_MAX_RATE} ]
157 sleep $((60-SECOND_NOW))
162 echo "Everything went right. Continue…"
165 echo "Unknown code: ${RESULT}. Exiting."
168 done 9< <( find "${SOURCE}" -type f
-name '*.tab' -print0 )