mad/hosts/1fichier.sh
kittykat 270e378e08
# 2025.03.30 - [ranoz] Fix to handle new cookie requirements
# 2025.03.28 - [up_ranoz] Fix to handle new cookie requirements
# 2025.03.28 - [up_anonfileio] Add anonfile.io as upload host
# 2025.03.28 - [anonfileio] Add anonfile.io as download host
# 2025.03.25 - [up_ranoz] Disable MAD randomized extension on uploads (7z block disabled)
# 2025.03.21 - [mad] Update random user agents 2025.03
# 2025.03.20 - [jira hosts] Update 3 jira hosts (retention and maxsize)
# 2025.03.16 - [torup] Fix torup cookies
# 2025.03.15 - [1fichier] Get new node prior to cdn download (greater possibility of a faster node)
# 2025.03.10 - [uploadscloud] Add uploadscloud.com as download host
2025-04-01 07:09:17 +00:00

383 lines
18 KiB
Bash

#! Name: 1fichier.sh
#! Author: kittykat
#! Version: 2025.03.15
#! Desc: Add support for downloading and processing of urls for a new host
#! Usage: Copy this file into the ./${ScriptDir}/hosts/ folder
#!
#!
#! ------------ REQUIRED SECTION ---------------
#! @[UPDATE] HostAndDomainRegexes: This string is loaded into mad.sh and allows dynamic handling of new url data
#! Format: '/HostCode/HostNick/HostFuncPrefix:HostDomainRegex@'
#! HostCode: <aUniqueCodeForHost> (ie. 'fh' for filehaus -- cannot be used by other hosts)
#! HostNick: What is displayed throughout MAD output (ie. 'filehaus' -- "urls.txt has 10 filehaus.." will be displayed)
#! HostFuncPrefix: <aUniqueStringThatMustPrefixHostFunctions> (ie. 'fh' -- fh_DownloadFile(), fh_FetchFileInfo() .. )
#! * Note: Must begin with a letter a-z (functions beginning with numbers are no bueno)
#! HostDomainRegex: The regex used to verify matching urls
HostCode='1f'
HostNick='1fichier'
HostFuncPrefix='fich'
HostUrls='1fichier.com, tenvoi.com, alterupload.com, cjoint.net, desfichiers.com, dfichiers.com, megadl.fr, mesfichiers.org, piecejointe.net, pjointe.com, dl4free.com'
HostDomainRegex='^(http|https)://(.*\.)?(1fichier\.com|tenvoi\.com|alterupload\.com|cjoint\.net|desfichiers\.com|dfichiers\.com|megadl\.fr|mesfichiers\.org|piecejointe\.net|pjointe\.com|dl4free\.com)/\?[a-z0-9]{20}$'
#!
#! !! DO NOT UPDATE OR REMOVE !!
#! This merges the Required HostAndDomainRegexes into mad.sh
ListHostAndDomainRegexes=${ListHostAndDomainRegexes}'/'${HostCode}'/'${HostNick}'/'${HostFuncPrefix}'/'${HostUrls}':'${HostDomainRegex}'@'
#!
#!
#! ------------ (1) Host Main Download Function --------------- #
#!
#! @REQUIRED: Host Main Download function
#! Must be named specifically as such:
#! <HostFuncPrefix>_DownloadFile()
fich_DownloadFile() {
warnAndRetryUnknownError=false
exitDownloadError=false
exitDownloadNotAvailable=false
fileAlreadyDone=false
local remote_url=${1}
local filecnt=${2}
fich_cookie_jar=""
fich_adz_parameter=""
target_file_link=""
fich_user_provided_password=""
is_password_protected=false
for ((y=1; y<=15; y++)); do
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; rm -f $lockfile; echo ""; tput cnorm; exit" 0 1 2 3 6 15
tor_identity="${RANDOM}"
PAGE=$(tor_curl_request --insecure --max-time "$ConnectTimeout" -s "${remote_url}")
if [[ "${DebugAllEnabled}" == "true" ]] ; then
debugHtml "${remote_url##*/?}" "prechk$y" "${PAGE}"
fi
file_information=$(grep -oP '(?<=<td class="normal">)[^<]*?(?=</td>)' <<< "${PAGE}")
size=$(echo "${file_information}" | tail -n 1)
filename=$(echo "${file_information}" | head -n 1)
if [[ ! "$filename_override" == "" ]] ; then
filename="$filename_override"
fi
filename=$(sanitize_file_or_folder_name "${filename}")
download_inflight_path="${WorkDir}/.inflight/"
completed_location="${WorkDir}/downloads/"
if grep -Eqi "The requested file has been deleted for inactivity|Le fichier demandé a été supprimé automatiquement pour inactivité" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) was removed due to inactivity${NC}"
removedDownload "${remote_url}"
return 1
elif
grep -Eqi "The requested file does not exist|It could be deleted by its owner" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) does not exist. Is the URL correct?${NC}"
removedDownload "${remote_url}"
return 1
elif
grep -Eqi "The requested file has been deleted|Le fichier demandé a été supprimé" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) has been deleted by owner${NC}"
removedDownload "${remote_url}"
return 1
elif
grep -Eqi "Le fichier demandé a été supprimé suite à un rapport d'abus|The requested file has been deleted following an abuse request" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) was reported and removed by 1fichier${NC}"
removedDownload "${remote_url}"
return 1
elif
grep -Eqi "deleted after its free hosting period expired" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) has expired and is removed${NC}"
removedDownload "${remote_url}"
return 1
elif
grep -Eqi "Le fichier demandé a été supprimé suite à une notification|The requested file has been deleted following a notification" <<< "${PAGE}"; then
echo -e "\n${RED}The file in URL (${remote_url}) was reported and removed by 1fichier${NC}"
removedDownload "${remote_url}"
return 1
fi
if [[ -z "$filename" || -z "$size" || ${size//[!0-9]/} =~ '^[0-9]+([.][0-9]+?$' ]]; then
if ((y == MaxUrlRetries )) ; then
echo -e "\n${RED}ERROR: Filename or size not found${NC}"
echo -e "url: ${remote_url}"
echo -e "filename: $filename"
echo -e "size: $size"
filenameOrSizeNotExistDownload "${remote_url}" "${filename}" "${size}"
return 1
fi
printf " ."
sleep 1
continue # Try again if not MaxUrlRetries
fi
if grep -q "id=\"pass\"" <<< "${PAGE}"; then
echo -e "${YELLOW}This download requires a password${NC}"
passwordProtectedDownload "${remote_url}"
return 1
fi
if ((y > 1 )) ; then
printf "\\n"
fi
echo -e "${GREEN}${filename} (${size}) is available.${NC}"
break
done
finalAttempt="false"
for ((z=0; z<=$MaxUrlRetries; z++)); do
if [[ $z -eq $MaxUrlRetries ]] ; then
finalAttempt="true"
fi
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; echo ""; tput cnorm; exit" 0 1 2 3 6 15
if fich_FindEmptySlot && fich_FetchFileInfo "" $((z+1)) $finalAttempt && fich_GetFile "${filecnt}" $((z+1)) $finalAttempt $filename ; then
return 0
elif [[ $z -lt $MaxUrlRetries ]]; then
if [[ "${fileAlreadyDone}" == "true" ]] ; then
break
fi
if [[ "${warnAndRetryUnknownError}" == "true" ]] ; then
if [[ "${DebugAllEnabled}" == "true" ]] ; then
debugHtml "${remote_url##*/?}" "error" "Retry due to an unknown issue: attempt #$((z+1)) of ${MaxUrlRetries}"
fi
fi
if [[ "${exitDownloadError}" == "true" || "${exitDownloadNotAvailable}" == "true" ]] ; then
if [[ "${DebugAllEnabled}" == "true" ]] ; then
debugHtml "${remote_url##*/?}" "error" "Exit due to unrecoverable issue"
fi
rm -f "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
break
fi
echo -e "\n${YELLOW}A recoverable error occurred, retry attempt $((z+1))/${MaxUrlRetries}${NC}"
sleep 3
fi
done
rm -f "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
}
#!
#! ------------- (2) Fetch File Info Function ----------------- #
#!
fich_FetchFileInfo() {
local fileCnt=$1
local num_attempt=$2
local finalAttempt=$3
echo -e "\nTrying to get CDN URL"
fich_adz_parameter=$(cat "${WorkDir}/.temp/fich_adz_parameter")
fich_cookie_jar=$(cat "${WorkDir}/.temp/fich_cookie_jar")
tor_identity=$(cat "${WorkDir}/.temp/fich_tor_identity")
rm -f "${WorkDir}/.temp/fich_cookie_jar"; rm -f "${WorkDir}/.temp/fich_adz_parameter"; rm -f "${WorkDir}/.temp/fich_tor_identity";
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; rm -f "${fich_cookie_jar}"; echo ""; tput cnorm; exit" 0 1 2 3 6 15
cdn_request=$(tor_curl_request --insecure -s -L -b "${fich_cookie_jar}" -c "${fich_cookie_jar}" -F "submit=Download" -F "pass=${fich_user_provided_password}" -F "adz=${fich_adz_parameter}" "${remote_url}")
target_file_link=$(echo "$cdn_request" | grep -A 2 '<div style="width:600px;height:80px;margin:auto;text-align:center;vertical-align:middle">' | grep -oP '<a href="\K[^"]+')
if [[ "${DebugAllEnabled}" == "true" ]] ; then
debugHtml "${remote_url##*/?}" "fich_cdn${num_attempt}_1" "target_file_link: ${target_file_link}"$'\n'"${cdn_request}"
fi
rm -f "${fich_cookie_jar}"
if ! grep -Eqi "https://" <<< "${target_file_link}" > /dev/null ; then
if $is_password_protected; then
echo -e "${RED}ERROR: Incorrect password${NC}\nSince this download required a password, you might have copied it incorrectly?"
passwordProtectedDownload "${remote_url}"
exitDownloadError=true
return 2
else
echo -e "${RED}ERROR: Could not find CDN URL${NC}"
if [[ "${finalAttempt}" == "true" ]] ; then
noCdnDownload "${remote_url}"
fi
return 1
fi
fi
echo -e "${GREEN}CDN URL has been found!${NC}"
}
#!
#! ----------- (3) Fetch File / Download File Function --------------- #
#!
fich_GetFile() {
local filecnt=$1
local num_attempt=$2
local finalAttempt=$3
local filename=$4
echo -e "\n${RED}${NC} Saving ${GREEN}${remote_url##*/?}${NC} to ${GREEN}${filename}${NC}"
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
for ((j=1; j<=4; j++)); do
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; echo ""; tput cnorm; exit" 0 1 2 3 6 15
file_header=$(tor_curl_request --insecure -sSIL -e "${remote_url}" "${target_file_link}")
file_size_bytes=$(grep -oPi '(?<=content-length: ).*' <<< "$file_header")
file_size_bytes=${file_size_bytes//[$'\t\r\n']}
download_inflight_path="${WorkDir}/.inflight/"
completed_location="${WorkDir}/downloads/"
file_path="${download_inflight_path}${filename}"
if [[ "${DebugAllEnabled}" == "true" ]] ; then
debugHtml "${remote_url##*/?}" "fich_savehead${num_attempt}_${j}" "target_file_link: ${target_file_link}"$'\n'"${file_header}"
fi
if [[ -z "$file_header" ]] || [[ -z "$file_size_bytes" ]]; then
continue
else
break
fi
done
if grep -Eqi "200 OK" <<< "${file_header}" > /dev/null ; then
echo "We good" > /dev/null
elif grep -Eqi "410 Gone" <<< "${file_header}" > /dev/null ; then
echo -e "${RED}ERROR: Failed to retrieve file header (410 Gone).${NC}\nThis could be due to 1fichier experiencing a temporary issue."
if [[ "${finalAttempt}" == "true" ]] ; then
failedDownload "${remote_url}" "${filename}" "410 Gone"
fi
return 1
elif grep -Eqi "403 Forbidden" <<< "${file_header}" > /dev/null ; then
echo -e "${RED}ERROR: Failed to retrieve file header (403 Forbidden).${NC}\nThis could be due to 1fichier experiencing a temporary issue."
if [[ "${finalAttempt}" == "true" ]] ; then
failedDownload "${remote_url}" "${filename}" "403 Forbidden"
fi
return 1
else
echo -e "${RED}ERROR: Failed to retrieve file header (Unknown Head Response).${NC}\nThis could be due to 1fichier experiencing a temporary issue."
if [[ "${finalAttempt}" == "true" ]] ; then
failedDownload "${remote_url}" "${filename}" "Unknown Head Response"
fi
return 1
fi
size_value=$(echo $size | cut -f1 -d' ')
size_unit=$(echo $size | cut -f2 -d' ')
case $size_unit in
KB|Ko) size_bytes=$(echo "$size_value * 1000" | bc);;
MB|Mo) size_bytes=$(echo "$size_value * 1000 * 1000" | bc);;
GB|Go) size_bytes=$(echo "$size_value * 1000 * 1000 * 1000" | bc);;
TB|To) size_bytes=$(echo "$size_value * 1000 * 1000 * 1000 * 1000" | bc);;
*) size_bytes=$size_value;;
esac
percent_threshold=0.01 # 1% error threshold, should be fine
percent_numerator=$(echo "$file_size_bytes - $size_bytes" | bc)
percent_diff=$(echo "${percent_numerator/-/} / (($file_size_bytes + $size_bytes) / 2)" | bc -l)
if (( $(echo "$percent_diff > $percent_threshold" |bc -l) )); then
echo -e "${RED}ERROR: The difference between the advertised and retrieved file size is too big${NC}\nThis is most likely due to someone else taking the slot or some other error along the way."
echo -e "AdvertisedSize: $size ($size_bytes), Size: $file_size_bytes, Diff: $percent_diff"
if [[ "${finalAttempt}" == "true" ]] ; then
droppedSizeBadDownload "${remote_url}" "${filename}" "${file_size_bytes}" "${size}"
fi
return 1
fi
flockDownload="${WorkDir}/.flocks/${filename//[^a-zA-Z0-9\.\_\-]/}.flock"
if CheckFileSize "${remote_url}" ${file_size_bytes} ; then
return 1
fi
if CheckDownloadExists "$remote_url" "$MoveToFolder" "$filecnt" "$filename" "$file_path" "$completed_location" ; then
return 1
fi
echo "${remote_url//[^a-zA-Z0-9]/}" > $flockDownload
touch "${WorkDir}/.flocks/${remote_url//[^a-zA-Z0-9]/}"
tor_identity="${RANDOM}"
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; rm -f $flockDownload; echo ""; tput cnorm; exit" 0 1 2 3 6 15
tor_curl_request --insecure -e "${remote_url}" "${target_file_link}" -C - -o "${file_path}"
rm -f "$flockDownload";
received_file_size=0
if [[ -f "$file_path" ]] ; then
received_file_size=$(stat --format="%s" "$file_path" | tr -d '[:space:]')
fi
if [[ "${received_file_size}" -ne "${file_size_bytes}" ]]; then
echo -e "${RED}ERROR: Size mismatch after downloading${NC}\nPerhaps you or 1fichier lost connection for a while?"
if [[ "${finalAttempt}" == "true" ]] ; then
droppedSizeBadDownload "${remote_url}" "${filename}" "${received_file_size}"
fi
return 1
fi
ProcessCompletedDownload "$remote_url" "$MoveToFolder" "$filecnt" "$filename" "$file_size_bytes" "$completed_location" "$file_path"
}
#!
#! --------------- Host Extra Functions ------------------- #
#!
fich_FindEmptySlot() {
mkdir -p "${WorkDir}/.temp"
local lockfile="${WorkDir}/.temp/lockfile.lock"
timer_start=$(date +%s)
while [[ -e $lockfile ]]; do
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; rm -f $lockfile; echo ""; tput cnorm; exit" 0 1 2 3 6 15
timer_duration=$(($(date +%s) - timer_start))
echo -e "Lock file in place, time elapsed: $timer_duration seconds"
sleep 1
printf "\033[F"
tput el
done
touch $lockfile
echo -e "\nSearching for a usable exit node"
mkdir -p "${WorkDir}/.temp"
rm -f "${WorkDir}/.temp/fich_adz_parameter"
sleep 0.2
instances="10"
timer_start=$(date +%s)
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap 'rm -f "${WorkDir}/.flocks/${CLEANSTRING}"; rm -f $lockfile; tput el; echo -e "${RED}Aborted by user!${NC}"; for i in $(seq 1 $instances); do tput el; echo ""; done; rm -f "${WorkDir}/.temp/fich_cookie_jar"; rm -f "${WorkDir}/.temp/fich_adz_parameter"; rm -f "${WorkDir}/.temp/tor_identity"; echo -e "${RED}Aborted by user!${NC}"; tput cnorm; exit' 0 1 2 3 6 15
for instance_no in $(seq 1 $instances); do
fich_FetchTorExitNode "${instance_no}" ${instances} &
sleep 0.1
done
wait
CLEANSTRING=${remote_url//[^a-zA-Z0-9]/}
trap "rm -f ${WorkDir}/.flocks/${CLEANSTRING}; rm -f $lockfile; rm -f "${WorkDir}/.temp/fich_cookie_jar"; rm -f "${WorkDir}/.temp/fich_adz_parameter"; rm -f "${WorkDir}/.temp/tor_identity"; echo ""; tput cnorm; exit" 0 1 2 3 6 15
if [[ $(stat -c '%s' "${WorkDir}/.temp/fich_adz_parameter") -lt 1 ]]; then
echo -e "${RED}One of the instances ran out of attempts, try again later${NC}"
return 1
fi
timer_end=$(date +%s)
timer_duration=$((timer_end - timer_start))
tput el
echo -e "${GREEN}Search took ${timer_duration} seconds${NC}"
rm -f $lockfile
}
fich_FetchTorExitNode() {
local max_attempts=${CircuitRetries}
local iter=0 instance_no="$1" time_out=5 instances="$2" fich_cookie_jar="" tor_identity="" fich_adz_parameter="" PAGE=""
mkdir -p "${WorkDir}/.temp"
while :; do
if [[ "${iter}" -ge "${max_attempts}" ]]; then
rm -f "$fich_cookie_jar"
if [[ -s "${WorkDir}/.temp/fich_adz_parameter" ]]; then
rm -f "$fich_cookie_jar"
exit 1
fi
echo "" > "${WorkDir}/.temp/fich_adz_parameter"
for i in $(seq 1 "$instances"); do echo ""; done
echo -e "\n${RED}Instance ${instance_no} ran out of attempts${NC}"
exit 1
fi
((iter++))
if [[ -s "${WorkDir}/.temp/fich_adz_parameter" ]]; then
tput el
printf "Closing instance %s\r" "${instance_no}"
rm -f "${fich_cookie_jar}" # new
exit 1
fi
for ((i=1; i<=instance_no; i++)) ; do
printf "\\n"
done
printf "Instance %s \t| Attempt %s \r" "${instance_no}" "${iter}/${max_attempts}"
for ((i=1; i<=instance_no; i++)) ; do
printf "\033[F"
done
if [[ ! $fich_adz_parameter ]]; then
rm -f "$fich_cookie_jar"
fich_cookie_jar=$(mktemp "${WorkDir}/.temp/fich_cookies""${instance_no}"".XXXXXX")
fi
tor_identity="${RANDOM}"
trap "rm -f ${fich_cookie_jar}; echo ""; tput cnorm; exit" 0 1 2 3 6 15
PAGE=$(tor_curl_request --insecure --max-time "$ConnectTimeout" -c "${fich_cookie_jar}" -s "${remote_url}")
if [[ -z ${PAGE} ]]; then
rm -f "${fich_cookie_jar}"
continue
fi
if grep -Eqi '<span style="color:red">Warning !</span>|<span style="color:red">Attention !</span>' <<< "${PAGE}"; then
rm -f "${fich_cookie_jar}"
continue
else
fich_adz_parameter=$(grep -oPi 'name="adz" value="\K[^"]+' <<< "${PAGE}")
if [[ $fich_adz_parameter ]]; then
if [[ -s "${WorkDir}/.temp/fich_adz_parameter" ]]; then
rm -f "$fich_cookie_jar"
exit 1
fi
echo "$fich_adz_parameter" > "${WorkDir}/.temp/fich_adz_parameter"
echo "$fich_cookie_jar" > "${WorkDir}/.temp/fich_cookie_jar"
echo "$tor_identity" > "${WorkDir}/.temp/fich_tor_identity"
rm -f "$fich_cookie_jar"
for i in $(seq 1 "$instances"); do echo ""; done
echo ""
tput el
echo -e "${GREEN}Slot found by instance ${instance_no}${NC}"
break
fi
fi
done
tput cnorm
}