# NOTE(review): the lines below look like repository-page residue (changelog entries and
#               file statistics) rather than script content; kept here as comments only.
# 2025.02.24 - [pixeldrain] Update "The file is IP limited" response handling retry
# 2025.02.22 - [blackcloud_onion] Add bcloud.onion download handling (url fixing)
# 2025.02.21 - [anonfile] Update cdn link parsing to handle new subdomains
# 2025.02.21 - [anonfile] Add download limit reached response handling
# 2025.02.21 - [anonfile] Update file info retrieval (head no longer responds)
# 2025.02.21 - [sendspace] Add sendspace.com as download host
# 2025.02.21 - [oshi / up_oshi] Revert /nossl/ changes for oshi.at (clearnet)
# 315 lines / 13 KiB / Bash
#! Name: anonsharing.sh
#! Author: kittykat
#! Version: 2024.10.30
#! Desc: Add support for downloading and processing of urls for a new host
#! Usage: Copy this file into the ./${ScriptDir}/hosts/ folder
#!
#!
#! ------------ REQUIRED SECTION ---------------
#! @[UPDATE] HostAndDomainRegexes: This string is loaded into mad.sh and allows dynamic handling of new url data
#!    Format: '/HostCode/HostNick/HostFuncPrefix/HostUrls:HostDomainRegex@'
#!      HostCode: <aUniqueCodeForHost> (ie. 'fh' for filehaus -- cannot be used by other hosts)
#!      HostNick: What is displayed throughout MAD output (ie. 'filehaus' -- "urls.txt has 10 filehaus.." will be displayed)
#!      HostFuncPrefix: <aUniqueStringThatMustPrefixHostFunctions> (ie. 'fh' -- fh_DownloadFile(), fh_FetchFileInfo() .. )
#!        * Note: Must begin with a letter a-z (functions beginning with numbers are no bueno)
#!      HostUrls: The host's domain name (ie. 'anonsharing.com')
#!      HostDomainRegex: The regex used to verify matching urls
#! Registration data for this host. The five values are joined below into one
#! '/HostCode/HostNick/HostFuncPrefix/HostUrls:HostDomainRegex@' entry.
HostCode='ansh'
HostNick='anonsharing'
HostFuncPrefix='ansh'
HostUrls='anonsharing.com'
HostDomainRegex='^(http|https)://(.*\.)?anonsharing\.com/fileid\='
#!
#! !! DO NOT UPDATE OR REMOVE !!
#! This merges the Required HostAndDomainRegexes into mad.sh
ListHostAndDomainRegexes=${ListHostAndDomainRegexes}'/'${HostCode}'/'${HostNick}'/'${HostFuncPrefix}'/'${HostUrls}':'${HostDomainRegex}'@'
#!
#!
#! ------------ (1) Host Main Download Function --------------- #
#!
#! @REQUIRED: Host Main Download function
#!           Must be named specifically as such:
#!           <HostFuncPrefix>_DownloadFile()
#! Download a single anonsharing url, making up to MaxUrlRetries + 1 attempts.
#!   $1 - remote url (kept as both remote_url and file_url)
#!   $2 - file count, handed on to ansh_GetFile
#! Resets the shared status flags (warnAndRetryUnknownError, exitDownloadError,
#! exitDownloadNotAvailable, fileAlreadyDone) and sets download_inflight_path,
#! completed_location, tor_identity, finalAttempt and CLEANSTRING for the callees.
#! Returns 0 as soon as ansh_FetchFileInfo and ansh_GetFile both succeed. When the
#! loop ends without success the status is that of the final lock removal (rm -f),
#! so callers should not rely on the return value alone to detect failure.
ansh_DownloadFile() {
  local remote_url=${1}
  local file_url=${1}
  local filecnt=${2}
  local z url_lock url_lock_q
  warnAndRetryUnknownError=false
  exitDownloadError=false
  exitDownloadNotAvailable=false
  fileAlreadyDone=false
  download_inflight_path="${WorkDir}/.inflight/"
  mkdir -p "$download_inflight_path"
  completed_location="${WorkDir}/downloads/"
  tor_identity="${RANDOM}"
  finalAttempt="false"
  for ((z = 0; z <= MaxUrlRetries; z++)); do
    if [[ $z -eq $MaxUrlRetries ]]; then
      finalAttempt="true"
    fi
    CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
    url_lock="${WorkDir}/.flocks/${CLEANSTRING}"
    # The trap body is re-parsed by the shell when it fires, so the path is
    # shell-quoted up front; otherwise a WorkDir containing spaces would be
    # split into several rm operands and the lock would be left behind.
    printf -v url_lock_q '%q' "$url_lock"
    trap "rm -f -- ${url_lock_q}; echo; tput cnorm; exit" 0 1 2 3 6 15
    if ansh_FetchFileInfo "$finalAttempt" && ansh_GetFile "${filecnt}" $((z + 1)) "$finalAttempt"; then
      return 0
    elif [[ $z -lt $MaxUrlRetries ]]; then
      if [[ "${fileAlreadyDone}" == "true" ]]; then
        break
      fi
      if [[ "${warnAndRetryUnknownError}" == "true" ]]; then
        if [[ "${DebugAllEnabled}" == "true" ]]; then
          debugHtml "${remote_url##*/}" "error" "Retry due to an unknown issue: attempt #$((z + 1)) of ${MaxUrlRetries}"
        fi
      fi
      if [[ "${exitDownloadError}" == "true" || "${exitDownloadNotAvailable}" == "true" ]]; then
        if [[ "${DebugAllEnabled}" == "true" ]]; then
          debugHtml "${remote_url##*/}" "error" "Exit due to unrecoverable issue"
        fi
        rm -f "${url_lock}"
        break
      fi
      echo -e "\n${YELLOW}A recoverable error occurred, retry attempt $((z + 1))/${MaxUrlRetries}${NC}"
      sleep 3
    fi
  done
  rm -f "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
}
#!
#! ------------- (2) Fetch File Info Function ----------------- #
#!
#! Resolve the download link, the cdn location and the file name for ${remote_url}.
#!   $1 - "true" on the last url-level attempt; failures are then also recorded
#!        through failedRetryDownload
#! Reads from the calling scope: remote_url, filecnt, filename_override,
#!   file_size_bytes, download_inflight_path, completed_location, MoveToFolder,
#!   WorkDir, instance_no, DebugAllEnabled.
#! Sets: finalAttempt, maxfetchretries, ansh_cookie_jar, download_url, filename,
#!   file_path, flockDownload, file_size_readable, bLocationFound, and on failure
#!   warnAndRetryUnknownError or exitDownloadError.
#! Returns non-zero when the link / header / file name cannot be obtained, or when
#!   CheckFileSize or CheckDownloadExists return 0; otherwise the status of writing
#!   the download flock file.
#! NOTE(review): file_size_bytes is never assigned in this function; whatever value
#!   is already in scope is displayed and passed to CheckFileSize -- confirm the
#!   caller clears it between downloads.
ansh_FetchFileInfo() {
  finalAttempt=$1
  maxfetchretries=5
  ansh_cookie_jar=""
  local fileid="${remote_url##*fileid\=}"
  local i j url_lock url_lock_q cookie_jar_q redirect_target
  CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
  url_lock="${WorkDir}/.flocks/${CLEANSTRING}"
  # Trap bodies are re-parsed when they fire, so paths are shell-quoted up front.
  printf -v url_lock_q '%q' "$url_lock"

  # ---- Step 1: ask the ajax endpoint for the file details and pull the link out.
  echo -e "${GREEN}# Fetching download link…${NC}"
  for ((i = 1; i <= maxfetchretries; i++)); do
    mkdir -p "${WorkDir}/.temp"
    ansh_cookie_jar=$(mktemp "${WorkDir}/.temp/ansh_cookies""${instance_no}"".XXXXXX")
    printf " ."
    tor_identity="${RANDOM}"
    CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
    printf -v cookie_jar_q '%q' "${ansh_cookie_jar}"
    trap "rm -f -- ${url_lock_q}; rm -f -- ${cookie_jar_q}; echo; tput cnorm; exit" 0 1 2 3 6 15
    response=$(tor_curl_request --insecure -i -s \
      -b "${ansh_cookie_jar}" -c "${ansh_cookie_jar}" \
      -F "u=$fileid" \
      -F "p=true" \
      "https://anonsharing.com/account/ajax/file_details")
    if [[ "${DebugAllEnabled}" == "true" ]]; then
      debugHtml "${remote_url##*/}" "ansh_postfileinfo$i" "${response}"
    fi
    if [[ -z $response ]]; then
      rm -f "${ansh_cookie_jar}"
      if [[ $i == $maxfetchretries ]]; then
        printf "\\n"
        echo -e "${RED}| Failed to extract download link [1]${NC}"
        warnAndRetryUnknownError=true
        if [[ "${finalAttempt}" == "true" ]]; then
          failedRetryDownload "${remote_url}" "Failed to extract download link [1]" ""
        fi
        return 1
      fi
      continue
    fi
    if grep -Eqi "There is no such file|File was deleted because" <<< "$response"; then
      rm -f "${ansh_cookie_jar}"
      printf "\\n"
      echo -e "${RED}| The file was not found. It could be deleted or expired.${NC}"
      exitDownloadError=true
      removedDownload "${remote_url}"
      return 1
    fi
    if grep -Eqi 'openUrl\('"'"'https:\\/\\/anonsharing.com\\/' <<< "$response"; then
      printf "\\n"
      echo -e "${GREEN}| Link found.${NC}"
      download_url='https://anonsharing.com/'$(grep -oPi '(?<=openUrl\('"'"'https:\\/\\/anonsharing.com\\/).*?(?='"'"'.*$)' <<< "$response" | head -1)
      # The link arrives with escaped slashes (\/); unescape and strip control chars.
      download_url="${download_url//\\\//\/}"
      download_url="${download_url//[$'\t\r\n\0']}"
      break
    fi
    rm -f "${ansh_cookie_jar}"
    if [[ $i == $maxfetchretries ]]; then
      printf "\\n"
      echo -e "${RED}| Failed to extract download link [2]${NC}"
      warnAndRetryUnknownError=true
      if [[ "${finalAttempt}" == "true" ]]; then
        failedRetryDownload "${remote_url}" "Failed to extract download link [2]" ""
      fi
      return 1
    fi
  done

  # ---- Step 2: follow the link to the cdn location and read the file name.
  bLocationFound=false
  for ((j = 1; j <= maxfetchretries; j++)); do
    CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
    printf -v cookie_jar_q '%q' "${ansh_cookie_jar}"
    trap "rm -f -- ${url_lock_q}; rm -f -- ${cookie_jar_q}; echo; tput cnorm; exit" 0 1 2 3 6 15
    if [[ "$bLocationFound" == "false" ]]; then
      echo -e "${GREEN}# Fetching cdn and file info…${NC}"
      file_header=$(tor_curl_request --insecure --head -L -i -s \
        -b "${ansh_cookie_jar}" -c "${ansh_cookie_jar}" \
        "$download_url")
    else
      echo -e "${GREEN}# Fetching file info…${NC}"
      ansh_host="${download_url/https:\/\//}"
      ansh_host="${ansh_host%%\/*}"
      rm -f "${WorkDir}/.temp/directhead"
      # The HEAD request runs in the background and is killed after 6 seconds;
      # whatever tee has passed through by then becomes the captured header.
      file_header=$(
        tor_curl_request --insecure --head -H "Connection: keep-alive" -s -i \
          -H "Host: $ansh_host" \
          "$download_url" |
          tee "${WorkDir}/.temp/directhead" &
        sleep 6
        [ -s "${WorkDir}/.temp/directhead" ]
        kill $! 2>/dev/null
      )
      if [[ ! -f "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}" ]]; then
        touch "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
      fi
      rm -f "${WorkDir}/.temp/directhead"
    fi
    if [[ "${DebugAllEnabled}" == "true" ]]; then
      debugHtml "${remote_url##*/}" "ansh_head$j" "download_url: ${download_url}"$'\n'"${file_header}"
    fi
    if [[ -z $file_header ]]; then
      if [[ $j == $maxfetchretries ]]; then
        rm -f "${ansh_cookie_jar}"
        printf "\\n"
        echo -e "${RED}| Failed to extract file info.${NC}"
        warnAndRetryUnknownError=true
        if [[ "${finalAttempt}" == "true" ]]; then
          failedRetryDownload "${remote_url}" "" ""
        fi
        return 1
      fi
      continue
    fi
    if grep -Eqi '404 Not Found' <<< "$file_header"; then
      rm -f "${ansh_cookie_jar}"
      printf "\\n"
      echo -e "${RED}| Failed to extract file info.${NC}"
      warnAndRetryUnknownError=true
      if [[ "${finalAttempt}" == "true" ]]; then
        failedRetryDownload "${remote_url}" "" ""
      fi
      return 1
    fi
    # Only an actual Location header counts as a redirect target. A bare "302"
    # substring elsewhere in the headers must not blank download_url, and a
    # direct cdn response without a Location is fine once one has been resolved.
    redirect_target=$(grep -oPi -m 1 '(?<=location: ).*?(?=$)' <<< "$file_header")
    redirect_target=${redirect_target//[$'\t\r\n']}
    if [[ -n "$redirect_target" ]]; then
      bLocationFound=true
      download_url=$redirect_target
    elif [[ "$bLocationFound" != "true" ]]; then
      rm -f "${ansh_cookie_jar}"
      printf "\\n"
      echo -e "${RED}| Failed to get download url (no location)${NC}"
      warnAndRetryUnknownError=true
      if [[ "${finalAttempt}" == "true" ]]; then
        failedRetryDownload "${remote_url}" "Failed to get download url (no location)" ""
      fi
      return 1
    fi
    filename=$(grep -oP '(?<=filename=").*?(?=".*$)' <<< "$file_header")
    if [[ "$filename_override" == "" ]] && [[ -z "$filename" ]]; then
      if [[ $j == $maxfetchretries ]]; then
        rm -f "${ansh_cookie_jar}"
        printf "\\n"
        echo -e "${RED}| Failed to extract file name${NC}"
        warnAndRetryUnknownError=true
        if [[ "${finalAttempt}" == "true" ]]; then
          failedRetryDownload "${remote_url}" "Failed to extract file name" ""
        fi
        return 1
      fi
      continue
    fi
    break #Good to go here
  done

  # ---- Step 3: publish the results and claim the download.
  rm -f "${ansh_cookie_jar}"
  touch "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
  if [[ ! "$filename_override" == "" ]]; then
    filename="$filename_override"
  fi
  filename=$(sanitize_file_or_folder_name "${filename}")
  printf "\\n"
  echo -e "${YELLOW}| File name:${NC}\t\"${filename}\""
  if [[ -z $file_size_bytes ]]; then
    file_size_readable="${RED}Unknown filesize…${NC}"
  else
    file_size_readable="$(numfmt --to=iec --from=auto --format "%.2f" <<< "$file_size_bytes")"
  fi
  echo -e "${YELLOW}| File size:${NC}\t${file_size_readable}"
  file_path="${download_inflight_path}${filename}"
  flockDownload="${WorkDir}/.flocks/${filename//[^a-zA-Z0-9\.\_\-]/}.flock"
  if CheckFileSize "${remote_url}" "${file_size_bytes}"; then
    return 1
  fi
  if CheckDownloadExists "$remote_url" "$MoveToFolder" "$filecnt" "$filename" "$file_path" "$completed_location"; then
    return 1
  fi
  # Quoted target: an unquoted redirect fails ("ambiguous redirect") when the
  # path contains whitespace.
  echo "${remote_url//[^a-zA-Z0-9]/}" > "$flockDownload"
}
#!
#! ----------- (3) Fetch File / Download File Function --------------- #
#!
#! Download ${download_url} into ${file_path}, making up to MaxDownloadRetries tries.
#!   $1 - file count (handed on to ProcessCompletedDownload)
#!   $2 - retry count of the calling url-level loop (stored in retryCnt)
#!   $3 - "true" on the last url-level attempt; a failed download is then also
#!        recorded through droppedSizeBadDownload
#! Reads from the calling scope: remote_url, download_url, filename, file_path,
#!   file_size_bytes, completed_location, MoveToFolder, ansh_cookie_jar, WorkDir.
#! Returns 0 after ProcessCompletedDownload has been invoked, 1 when every try
#!   either produced no file or (with AutoRepairBadPartials) a rejected one.
#! NOTE(review): the transfer never resumes (plain --output), yet a rejected file is
#!   truncated back to its pre-download size when a partial existed -- confirm that
#!   keeping such a partial is intended.
ansh_GetFile() {
  echo -e "${GREEN}# Downloading…"
  echo -e "${YELLOW}| File path:${NC}\t./.inflight/${filename}\n"
  # Keep $1 in a local as well, so the value handed to ProcessCompletedDownload
  # does not depend on a caller-scoped variable named filecnt.
  local file_count=$1
  local j url_lock_q cookie_jar_q flock_q
  fileCnt=$1
  retryCnt=$2
  finalAttempt=$3
  flockDownload="${WorkDir}/.flocks/${filename//[^a-zA-Z0-9\.\_\-]/}.flock"
  for ((j = 1; j <= MaxDownloadRetries; j++)); do
    pd_presize=0
    if [[ -f "$file_path" ]]; then
      pd_presize=$(stat --format="%s" "$file_path" | tr -d '[:space:]')
    fi
    GetRandomUA
    CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
    # Trap bodies are re-parsed when they fire, so every path is shell-quoted.
    printf -v url_lock_q '%q' "${WorkDir}/.flocks/${CLEANSTRING}"
    printf -v cookie_jar_q '%q' "${ansh_cookie_jar}"
    printf -v flock_q '%q' "${flockDownload}"
    trap "rm -f -- ${url_lock_q}; rm -f -- ${cookie_jar_q}; rm -f -- ${flock_q}; echo; tput cnorm; exit" 0 1 2 3 6 15
    echo -e "${BLUE}| No Resume Fetch${NC} (unknown filesize)"
    if [[ "${RateMonitorEnabled}" == "true" ]]; then
      tor_curl_request --insecure --speed-limit "$DownloadSpeedMin" --speed-time "$DownloadTimeoutInterval" "$download_url" --output "$file_path"
    else
      tor_curl_request --insecure "$download_url" --output "$file_path"
    fi
    received_file_size=0
    if [[ -f "$file_path" ]]; then
      received_file_size=$(stat --format="%s" "$file_path" | tr -d '[:space:]')
    fi
    # Nothing on disk means the transfer failed outright; never report that as a
    # completed download. Failure reporting mirrors the rejected-file branch below.
    if [[ ! -f "$file_path" ]]; then
      if ((j >= MaxDownloadRetries)); then
        rm -f "$flockDownload"
        if [[ "${finalAttempt}" == "true" ]]; then
          droppedSizeBadDownload "${remote_url}" "${filename}" "${received_file_size}"
        fi
        return 1
      fi
      echo -e "${YELLOW}No file received:${NC} retrying..."
      continue
    fi
    if CheckNoHtml "$remote_url" "$filename" "$file_path" "$((received_file_size - pd_presize))"; then
      containsHtml=false
    else
      containsHtml=true
    fi
    if [[ "${AutoRepairBadPartials}" == "true" ]] && [[ "$containsHtml" == "true" ]]; then
      if [[ -f "${file_path}" ]]; then
        if ((pd_presize > 0)); then
          echo -e "${YELLOW}Bad node / HTML found:${NC} reverting to previous file..."
          truncateDownload "$remote_url" "$filename" "$pd_presize" "$received_file_size"
          truncate -s "$pd_presize" "${file_path}"
        else
          echo -e "${YELLOW}Bad node / HTML found:${NC} tainted partial removed..."
          rm -f "${file_path}"
        fi
      fi
      if ((j >= MaxDownloadRetries)); then
        rm -f "$flockDownload"
        if [[ "${finalAttempt}" == "true" ]]; then
          droppedSizeBadDownload "${remote_url}" "${filename}" "${received_file_size}"
        fi
        return 1
      fi
      continue
    fi
    break
  done
  rm -f "$flockDownload"
  ProcessCompletedDownload "$remote_url" "$MoveToFolder" "$file_count" "$filename" "$file_size_bytes" "$completed_location" "$file_path"
  return 0
}
#!
#! --------------- Host Extra Functions ------------------- #
#!