finally don't use kivy

This commit is contained in:
Mylloon 2021-08-27 00:19:21 +02:00
parent 35b2db7395
commit f703645d77
6 changed files with 199 additions and 553 deletions

5
.gitignore vendored
View file

@ -5,8 +5,3 @@ pyvenv.cfg
# vscode # vscode
.vscode/ .vscode/
# app
.env
results.csv
.buildozer/

View file

@ -8,11 +8,6 @@ Or create `.env` file inside the repo folder with `PSEUDO_MOBILISM`, `PASSWORD_M
You can also add `DEBUG_MOBILISM` variable to add some verboses (only to `.env` file). You can also add `DEBUG_MOBILISM` variable to add some verboses (only to `.env` file).
### [Build](https://kivy.org/doc/stable/guide/packaging-android.html)
Install requirements: `pip install -r requirements.txt`
Install Buildozer's [dependencies](https://buildozer.readthedocs.io/en/latest/installation.html#targeting-android) (you may need to delete your existing `.buildozer` folder)
Plug in your android device and run `buildozer android release`
#### Applications tested #### Applications tested
``` ```
Plex, Spotify, Tiktok, Clash of Clans, Clash Royale, Twitch, Brawl Stars Plex, Spotify, Tiktok, Clash of Clans, Clash Royale, Twitch, Brawl Stars

View file

@ -1,329 +0,0 @@
[app]
# (str) Title of your application
title = MobiDL
# (str) Package name
package.name = mobidownloader
# (str) Package domain (needed for android/ios packaging)
package.domain = com.mylloon
# (str) Source code where the main.py live
source.dir = .
# (list) Source files to include (let empty to include all the files)
source.include_exts = py,png,kv,atlas
# (list) List of inclusions using pattern matching
#source.include_patterns =
# (list) Source files to exclude (let empty to not exclude anything)
#source.exclude_exts = spec,md,txt,csv,gitignore,env
# (list) List of directory to exclude (let empty to not exclude anything)
#source.exclude_dirs = tests, bin, lib, .vscode
# (list) List of exclusions using pattern matching
#source.exclude_patterns = LICENCE,images/*/*.jpg
# (str) Application versioning (method 1)
version = 0.1
# (str) Application versioning (method 2)
# version.regex = __version__ = ['"](.*)['"]
# version.filename = %(source.dir)s/main.py
# (list) Application requirements
# comma separated e.g. requirements = sqlite3,kivy
requirements = python3,kivy,requests,python-dotenv,cloudscraper
# (str) Custom source folders for requirements
# Sets custom source for any requirements with recipes
# requirements.source.kivy = ../../kivy
# (list) Garden requirements
#garden_requirements =
# (str) Presplash of the application
#presplash.filename = %(source.dir)s/data/presplash.png
# (str) Icon of the application
#icon.filename = %(source.dir)s/data/icon.png
# (str) Supported orientation (one of landscape, sensorLandscape, portrait or all)
orientation = portrait
# (list) List of service to declare
#services = NAME:ENTRYPOINT_TO_PY,NAME2:ENTRYPOINT2_TO_PY
#
# OSX Specific
#
#
# author = © Copyright Info
# change the major version of python used by the app
osx.python_version = 3
# Kivy version to use
osx.kivy_version = 1.9.1
#
# Android specific
#
# (bool) Indicate if the application should be fullscreen or not
fullscreen = 0
# (string) Presplash background color (for new android toolchain)
# Supported formats are: #RRGGBB #AARRGGBB or one of the following names:
# red, blue, green, black, white, gray, cyan, magenta, yellow, lightgray,
# darkgray, grey, lightgrey, darkgrey, aqua, fuchsia, lime, maroon, navy,
# olive, purple, silver, teal.
#android.presplash_color = black
# (list) Permissions
#android.permissions = INTERNET
# (int) Target Android API, should be as high as possible.
#android.api = 27
# (int) Minimum API your APK will support.
#android.minapi = 21
# (int) Android SDK version to use
#android.sdk = 20
# (str) Android NDK version to use
#android.ndk = 19b
# (int) Android NDK API to use. This is the minimum API your app will support, it should usually match android.minapi.
#android.ndk_api = 21
# (bool) Use --private data storage (True) or --dir public storage (False)
#android.private_storage = True
# (str) Android NDK directory (if empty, it will be automatically downloaded.)
#android.ndk_path =
# (str) Android SDK directory (if empty, it will be automatically downloaded.)
#android.sdk_path =
# (str) ANT directory (if empty, it will be automatically downloaded.)
#android.ant_path =
# (bool) If True, then skip trying to update the Android sdk
# This can be useful to avoid excess Internet downloads or save time
# when an update is due and you just want to test/build your package
# android.skip_update = False
# (bool) If True, then automatically accept SDK license
# agreements. This is intended for automation only. If set to False,
# the default, you will be shown the license when first running
# buildozer.
# android.accept_sdk_license = True
# (str) Android entry point, default is ok for Kivy-based app
#android.entrypoint = org.renpy.android.PythonActivity
# (str) Android app theme, default is ok for Kivy-based app
# android.apptheme = "@android:style/Theme.NoTitleBar"
# (list) Pattern to whitelist for the whole project
#android.whitelist =
# (str) Path to a custom whitelist file
#android.whitelist_src =
# (str) Path to a custom blacklist file
#android.blacklist_src =
# (list) List of Java .jar files to add to the libs so that pyjnius can access
# their classes. Don't add jars that you do not need, since extra jars can slow
# down the build process. Allows wildcards matching, for example:
# OUYA-ODK/libs/*.jar
#android.add_jars = foo.jar,bar.jar,path/to/more/*.jar
# (list) List of Java files to add to the android project (can be java or a
# directory containing the files)
#android.add_src =
# (list) Android AAR archives to add (currently works only with sdl2_gradle
# bootstrap)
#android.add_aars =
# (list) Gradle dependencies to add (currently works only with sdl2_gradle
# bootstrap)
#android.gradle_dependencies =
# (list) add java compile options
# this can for example be necessary when importing certain java libraries using the 'android.gradle_dependencies' option
# see https://developer.android.com/studio/write/java8-support for further information
# android.add_compile_options = "sourceCompatibility = 1.8", "targetCompatibility = 1.8"
# (list) Gradle repositories to add {can be necessary for some android.gradle_dependencies}
# please enclose in double quotes
# e.g. android.gradle_repositories = "maven { url 'https://kotlin.bintray.com/ktor' }"
#android.add_gradle_repositories =
# (list) packaging options to add
# see https://google.github.io/android-gradle-dsl/current/com.android.build.gradle.internal.dsl.PackagingOptions.html
# can be necessary to solve conflicts in gradle_dependencies
# please enclose in double quotes
# e.g. android.add_packaging_options = "exclude 'META-INF/common.kotlin_module'", "exclude 'META-INF/*.kotlin_module'"
#android.add_packaging_options =
# (list) Java classes to add as activities to the manifest.
#android.add_activities = com.example.ExampleActivity
# (str) OUYA Console category. Should be one of GAME or APP
# If you leave this blank, OUYA support will not be enabled
#android.ouya.category = GAME
# (str) Filename of OUYA Console icon. It must be a 732x412 png image.
#android.ouya.icon.filename = %(source.dir)s/data/ouya_icon.png
# (str) XML file to include as an intent filters in <activity> tag
#android.manifest.intent_filters =
# (str) launchMode to set for the main activity
#android.manifest.launch_mode = standard
# (list) Android additional libraries to copy into libs/armeabi
#android.add_libs_armeabi = libs/android/*.so
#android.add_libs_armeabi_v7a = libs/android-v7/*.so
#android.add_libs_arm64_v8a = libs/android-v8/*.so
#android.add_libs_x86 = libs/android-x86/*.so
#android.add_libs_mips = libs/android-mips/*.so
# (bool) Indicate whether the screen should stay on
# Don't forget to add the WAKE_LOCK permission if you set this to True
#android.wakelock = False
# (list) Android application meta-data to set (key=value format)
#android.meta_data =
# (list) Android library project to add (will be added in the
# project.properties automatically.)
#android.library_references =
# (list) Android shared libraries which will be added to AndroidManifest.xml using <uses-library> tag
#android.uses_library =
# (str) Android logcat filters to use
#android.logcat_filters = *:S python:D
# (bool) Copy library instead of making a libpymodules.so
#android.copy_libs = 1
# (str) The Android arch to build for, choices: armeabi-v7a, arm64-v8a, x86, x86_64
android.arch = arm64-v8a
# (int) overrides automatic versionCode computation (used in build.gradle)
# this is not the same as app version and should only be edited if you know what you're doing
# android.numeric_version = 1
#
# Python for android (p4a) specific
#
# (str) python-for-android fork to use, defaults to upstream (kivy)
#p4a.fork = kivy
# (str) python-for-android branch to use, defaults to master
#p4a.branch = master
# (str) python-for-android git clone directory (if empty, it will be automatically cloned from github)
#p4a.source_dir =
# (str) The directory in which python-for-android should look for your own build recipes (if any)
#p4a.local_recipes =
# (str) Filename to the hook for p4a
#p4a.hook =
# (str) Bootstrap to use for android builds
# p4a.bootstrap = sdl2
# (int) port number to specify an explicit --port= p4a argument (eg for bootstrap flask)
#p4a.port =
#
# iOS specific
#
# (str) Path to a custom kivy-ios folder
#ios.kivy_ios_dir = ../kivy-ios
# Alternately, specify the URL and branch of a git checkout:
ios.kivy_ios_url = https://github.com/kivy/kivy-ios
ios.kivy_ios_branch = master
# Another platform dependency: ios-deploy
# Uncomment to use a custom checkout
#ios.ios_deploy_dir = ../ios_deploy
# Or specify URL and branch
ios.ios_deploy_url = https://github.com/phonegap/ios-deploy
ios.ios_deploy_branch = 1.7.0
# (str) Name of the certificate to use for signing the debug version
# Get a list of available identities: buildozer ios list_identities
#ios.codesign.debug = "iPhone Developer: <lastname> <firstname> (<hexstring>)"
# (str) Name of the certificate to use for signing the release version
#ios.codesign.release = %(ios.codesign.debug)s
[buildozer]
# (int) Log level (0 = error only, 1 = info, 2 = debug (with command output))
log_level = 2
# (int) Display warning if buildozer is run as root (0 = False, 1 = True)
warn_on_root = 1
# (str) Path to build artifact storage, absolute or relative to spec file
# build_dir = ./.buildozer
# (str) Path to build output (i.e. .apk, .ipa) storage
# bin_dir = ./bin
# -----------------------------------------------------------------------------
# List as sections
#
# You can define all the "list" as [section:key].
# Each line will be considered as a option to the list.
# Let's take [app] / source.exclude_patterns.
# Instead of doing:
#
#[app]
#source.exclude_patterns = license,data/audio/*.wav,data/images/original/*
#
# This can be translated into:
#
#[app:source.exclude_patterns]
#license
#data/audio/*.wav
#data/images/original/*
#
# -----------------------------------------------------------------------------
# Profiles
#
# You can extend section / key with a profile
# For example, you want to deploy a demo version of your application without
# HD content. You could first change the title to add "(demo)" in the name
# and extend the excluded directories to remove the HD content.
#
#[app@demo]
#title = My Application (demo)
#
#[app:source.exclude_patterns@demo]
#images/hd/*
#
# Then, invoke the command line with the "demo" profile:
#
#buildozer --profile demo android debug

206
main.py
View file

@ -1,10 +1,202 @@
import kivy from sys import argv
from kivy.app import App from os import environ
from kivy.uix.label import Label from dotenv import load_dotenv
from cloudscraper import CloudScraper, create_scraper
from re import findall, sub
class MobiDL(App): class Scraper:
def build(self): def __init__(self, pseudo: str, password: str, app: str, debug: bool = False):
return Label(text = "...") self.debug = debug
self.url = "https://forum.mobilism.org"
self.requested_app = app
self.loginData = {
"username": pseudo,
"password": password,
"login": "Login"
}
def errorFormat(self, code: int = None, message: str = "") -> str:
    """Build a one-line error message shaped like ``[code] message.``.

    The bracketed code is left out when ``code`` is falsy, and the separating
    space is only emitted when there is both a code and a non-empty message.
    A trailing period is always appended.
    """
    prefix = f"[{code}]" if code else ""
    separator = " " if len(message) > 0 and code else ""
    return f"{prefix}{separator}{message}."
def connect(self) -> CloudScraper:
    """Create a cloudscraper session and post the login form to the forum.

    Returns:
        The session on which the login request was sent.

    Raises:
        SystemError: when ``create_scraper`` hands back a falsy session.
        ConnectionRefusedError: when the login request does not answer 200.
    """
    # Ask the Cloudflare bypasser to present itself as Chrome on Windows.
    browserProfile = {"browser": "chrome", "platform": "windows"}
    session = create_scraper(browser = browserProfile)
    if not session:
        raise SystemError(self.errorFormat(message = "The creation of the session failed"))

    if self.debug:
        print("Connection attempt...")

    # "mode=login" is already the forum default; it is passed explicitly in
    # case the forum changes that default.
    loginReply = session.post(
        f"{self.url}/ucp.php",
        data = self.loginData,
        params = {"mode": "login"},
    )
    if loginReply.status_code != 200:
        raise ConnectionRefusedError(self.errorFormat(code = loginReply.status_code, message = "Unable to connect"))
    return session
def search(self, session: CloudScraper) -> tuple[list[dict], list[dict]]:
    """Run the title-only topic search and gather details on the first hits.

    The parsed topics are also written to disk through ``self.save``.

    Returns:
        A pair ``(topics, infos)``: the output of ``self.parse`` on the
        results page and the output of ``self.getInfos`` on those topics.

    Raises:
        ConnectionError: when the page carries the "not permitted" notice
            (login did not work) or when the status code is not 200.
    """
    if self.debug:
        print("Going to search page and check connection...", end = " ")

    query = {"keywords": self.requested_app, "sr": "topics", "sf": "titleonly"}
    resultsPage = session.get(f"{self.url}/search.php", params = query)

    # The refusal notice is checked before the status code, as the forum
    # shows it to visitors who are not logged in.
    refusalNotice = "Sorry but you are not permitted to use the search system. If you're not logged in please"
    if refusalNotice in resultsPage.text:
        raise ConnectionError(self.errorFormat(message = "Connection failed, check credentials"))
    if resultsPage.status_code != 200:
        raise ConnectionError(self.errorFormat(code = resultsPage.status_code, message = "Impossible to make the search"))

    if self.debug:
        print("Connected.")
    if self.debug:
        print(f"Fetching results for {self.requested_app}...", end = " ")

    topics = self.parse(resultsPage.text)
    self.save(topics)
    details = self.getInfos(session, topics)
    return topics, details
def parse(self, htmlPage: str) -> list[dict]:
    """Turn the HTML of a search results page into a list of topic dicts.

    Each dict has the keys ``title``, ``author``, ``date``, ``link`` and
    ``linkParams`` (a ``{"f": ..., "t": ...}`` dict usable as query
    parameters). Any field that cannot be extracted is ``None``; in
    particular ``link`` and ``linkParams`` are both ``None`` when no topic
    URL is found, instead of raising.

    Returns:
        An empty list when the page reports no match or contains no result
        row, otherwise one dict per result row.
    """
    if "No suitable matches were found." in htmlPage:
        return []

    # Every result row starts with this marker; what precedes the first one
    # is page header.
    elements = htmlPage.split("<tr>\n<td>")[1:]
    if not elements:
        return []
    # Cut the page footer off the last row.
    elements[-1] = elements[-1].split("</td>\n</tr>")[0]

    for i, rawRow in enumerate(elements):
        titles = findall(r"class=\"topictitle\">(.*)<\/a>", rawRow)
        _title = sub(r" ?&amp; ?", " ", titles[0]) if titles else None

        authors = findall(r"(<br />|</strong>)\n\n?<i class=\"icon-user\"></i> by <a href=\"\./memberlist\.php\?mode=viewprofile&amp;u=\d+\"( style=\"color: #.*;\" class=\"username-coloured\")?>(.*)</a>", rawRow)
        # findall yields one tuple per match; the user name is the last group.
        _author = authors[0][-1] if authors else None

        links = findall(r"\./viewtopic\.php\?f=(\d*)&amp;t=(\d*)&amp", rawRow)
        _link = {"f": links[0][0], "t": links[0][1]} if links else None

        dates = findall(r"</a> <i class=\"icon-time\"></i> <small>(.*)</small>", rawRow)
        _date = dates[0] if dates else None

        # Raw HTML dump, only useful when debugging the regexes.
        if self.debug:
            print("\n" + rawRow + "\n")

        if _link is None:
            _url = None
        else:
            _url = f"{self.url}/viewtopic.php?f={_link['f']}&t={_link['t']}"
        elements[i] = {"title": _title, "author": _author, "date": _date, "link": _url, "linkParams": _link}
    return elements
def getInfos(self, session: CloudScraper, elements: list) -> list:
    """Fetch the topic pages of the first results and parse them.

    Only the first three entries of ``elements`` are requested, using each
    entry's ``linkParams`` as query parameters.

    Returns:
        An empty list when ``elements`` is empty, otherwise the output of
        ``self.parsingInfos`` on the fetched pages.

    Raises:
        ConnectionError: when one of the topic pages does not answer 200.
    """
    size = len(elements)
    if size == 0:
        return []

    page = 3
    if self.debug:
        print(f"Going to the {page} first pages...", end = " ")

    fetched = []
    for position, topic in enumerate(elements[:page]):
        topicPage = session.get(f"{self.url}/viewtopic.php", params = topic["linkParams"])
        fetched.append(topicPage)
        if topicPage.status_code != 200:
            raise ConnectionError(self.errorFormat(code = topicPage.status_code, message = f"Error while doing the search n°{position}"))

    if self.debug:
        print("Done.")
    if self.debug:
        print("Parsing results page...", end = " ")
    parsed = self.parsingInfos(fetched)
    if self.debug:
        print("Done.")
    return parsed
def parsingInfos(self, elements: list) -> list[dict]:
    """Extract the changelog and the download links from topic pages.

    ``elements`` is a list of objects exposing the page HTML as ``.text``.
    The list is rewritten in place: each entry becomes a dict with the keys
    ``changelogs`` and ``downloadLinks``, and the same list is returned.

    * A page without "Download Instructions" gives ``None`` for both keys.
    * A missing changelog gives the text "No changelog found.".
    * Download links that cannot be located give ``None`` instead of
      raising while cleaning them up.
    """
    for i, page in enumerate(elements):
        html = page.text
        if "Download Instructions" not in html:
            elements[i] = {"changelogs": None, "downloadLinks": None}
            continue

        try:
            _changelogs = findall(r"What's New:</span> ?<br />(.*)<br /><br /><span style=\"c|font-weight: bold\">T", html)[0]
            if len(_changelogs) < 2: # nothing captured, try the other layout
                _changelogs = findall(r"What's New:</span> ?<br />(.*)<br /><br /><span style=\"font-weight: bold\">T", html)[0]
        except IndexError: # no match at all
            _changelogs = "No changelog found."

        # Drop whatever sits between the heading and the first "<br /><s".
        html = sub(r"Download Instructions:</span>(.*)?<br /><s", "Download Instructions:</span><br /><s", html)
        try:
            _downloadLinks = findall(r"Download Instructions:</span> ?<br />(.*|[\s\S]*)<br /><br />Trouble downloading|</a></div>", html)[0]
            if len(_downloadLinks) < 2: # nothing captured, try the other layout
                _downloadLinks = findall(r"Download Instructions:</span> ?<br />(.*|[\s\S]*)</a></div>", html)[0]
        except IndexError: # no match at all
            _downloadLinks = None

        # The clean-up only makes sense on text; sub() rejects None.
        if _downloadLinks is not None:
            _downloadLinks = sub(r"\n|<a class=\"postlink\" href=\"|\(Closed Filehost\) ?|<span style=\"font-weight: bold\">|</span>|\">(\S*)</a>", "", _downloadLinks) # remove html garbage
            _downloadLinks = sub(r"<br />\n?", "\n", _downloadLinks) # convert newline html to \n
            _downloadLinks = sub(r"Mirrors(?!:)|Mirror(?!s)(?!:)", "Mirror:", _downloadLinks) # add ":"
            _downloadLinks = _downloadLinks.split('">')[0]

        elements[i] = {"changelogs": _changelogs, "downloadLinks": _downloadLinks}
    return elements
def prettyPrint(self, topics: tuple[list[dict], list[dict]]) -> list:
    """Print a readable summary of each detailed topic and return the data.

    ``topics`` is the ``(topics, infos)`` pair returned by ``search``. One
    entry is produced per item of ``infos``, merged with the topic found at
    the same index.

    Returns:
        An empty list when there is no topic, otherwise a list of dicts with
        the keys ``title``, ``author``, ``date``, ``changelogs`` and
        ``downloadLinks``.
    """
    topicList, infoList = topics
    if len(topicList) == 0:
        return []

    print("\n")
    result = []
    for index, infos in enumerate(infoList):
        topic = topicList[index]
        entry = {
            "title": topic["title"],
            "author": topic["author"],
            "date": topic["date"],
            # HTML line breaks become real newlines for display
            "changelogs": str(infos["changelogs"]).replace("<br />", "\n"),
            "downloadLinks": infos["downloadLinks"],
        }
        result.append(entry)
        # One print per entry; joining with "\n" gives the same output as
        # printing each line separately.
        print("\n".join([
            f"Title: {entry['title']}\n",
            f"Author: {entry['author']}\n",
            f"Date of release: {entry['date']}\n",
            f"Changelogs: \n{entry['changelogs']}\n",
            f"Download links: \n{entry['downloadLinks']}",
            "\n\n---\n",
        ]))
    return result
def work(self) -> list:
    """Run the whole pipeline: connect, search, then print the results.

    Returns:
        Whatever ``prettyPrint`` returns for the search outcome.
    """
    session = self.connect()
    found = self.search(session)
    return self.prettyPrint(found)
def save(self, elements: list) -> None:
    """Write the parsed topics to ``results.csv`` in the current directory.

    The file is ``;``-separated and UTF-8 encoded. Its header is made of the
    keys of the first element minus ``linkParams``, and every row holds the
    matching values converted with ``str``. Values containing the separator
    or a quote are quoted by the ``csv`` module so the columns stay aligned.

    Nothing is written when ``elements`` is empty; a message is printed in
    both cases.
    """
    import csv # local import so this method does not depend on the file header

    size = len(elements)
    if size == 0:
        print("No elements were found with the search.")
        return

    filename = "results.csv"
    # linkParams is a dict of query parameters, not meant for the CSV
    header = [key for key in elements[0] if key != "linkParams"]
    # newline="" lets the csv module control line endings itself
    with open(filename, "w", encoding = "utf-8", newline = "") as f:
        writer = csv.writer(f, delimiter = ";", lineterminator = "\n")
        writer.writerow(header)
        writer.writerows([str(element.get(key)) for key in header] for element in elements)
    print(f"{size} elements have been registered in the {filename} file.")
if __name__ == "__main__": if __name__ == "__main__":
MobiDL().run() argv = argv[1:]
if len(argv) < 1: # no args
print("No App to retrieve.")
exit(1)
load_dotenv() # load .env file
try:
try: # for logs
debug = environ["DEBUG_MOBILISM"].lower() in ("yes", "true", "1")
except:
debug = False
try: # try to fetch credentials from de .env first
pseudoMobilism = environ["PSEUDO_MOBILISM"]
passwordMobilism = environ["PASSWORD_MOBILISM"]
except: # if it failed try to get from the cli
if len(argv) >= 3:
pseudoMobilism = argv[0]
passwordMobilism = argv[1]
argv = argv[-2:]
else: # if it failed again there is a problem
raise KeyError
Scraper(pseudoMobilism, passwordMobilism, " ".join([n for n in argv]), debug).work() # call the work() function
except KeyError:
print('Please fill in the username and password (with quotes) by args or with .env file and give an app to retrieve.')

View file

@ -2,8 +2,3 @@
requests==2.26.0 requests==2.26.0
python-dotenv==0.19.0 python-dotenv==0.19.0
cloudscraper==1.2.58 cloudscraper==1.2.58
# gui
kivy[base]==2.0.0 # app core
buildozer==1.2.0 # app builder
Cython==0.29.19 # buildozer dependency

View file

@ -1,202 +0,0 @@
from sys import argv
from os import environ
from dotenv import load_dotenv
from cloudscraper import CloudScraper, create_scraper
from re import findall, sub
class Scraper:
    """Search forum.mobilism.org for an application and collect release info.

    The usual entry point is ``work()``, which logs in, runs a title-only
    topic search, saves the hits to ``results.csv``, fetches the first topic
    pages and prints their changelog and download links.
    """

    def __init__(self, pseudo: str, password: str, app: str, debug: bool = False):
        """Store the search term, the debug flag and the login form payload."""
        self.debug = debug
        self.url = "https://forum.mobilism.org"
        self.requested_app = app
        self.loginData = {
            "username": pseudo,
            "password": password,
            "login": "Login"
        }

    def errorFormat(self, code: int = None, message: str = "") -> str:
        """Build a one-line error message shaped like ``[code] message.``.

        The bracketed code is left out when ``code`` is falsy, and the
        separating space is only emitted when there is both a code and a
        non-empty message. A trailing period is always appended.
        """
        prefix = f"[{code}]" if code else ""
        separator = " " if len(message) > 0 and code else ""
        return f"{prefix}{separator}{message}."

    # The CloudScraper annotations below are quoted so that defining the
    # class does not require the name to be resolvable.
    def connect(self) -> "CloudScraper":
        """Create a cloudscraper session and post the login form to the forum.

        Returns:
            The session on which the login request was sent.

        Raises:
            SystemError: when ``create_scraper`` hands back a falsy session.
            ConnectionRefusedError: when the login request does not answer 200.
        """
        # Ask the Cloudflare bypasser to present itself as Chrome on Windows.
        session = create_scraper(browser = {"browser": "chrome", "platform": "windows"})
        if not session:
            raise SystemError(self.errorFormat(message = "The creation of the session failed"))

        if self.debug:
            print("Connection attempt...")

        # "mode=login" is already the forum default; it is passed explicitly
        # in case the forum changes that default.
        reponse = session.post(f"{self.url}/ucp.php", data = self.loginData, params = {"mode": "login"})
        if reponse.status_code != 200:
            raise ConnectionRefusedError(self.errorFormat(code = reponse.status_code, message = "Unable to connect"))
        return session

    def search(self, session: "CloudScraper") -> tuple[list[dict], list[dict]]:
        """Run the title-only topic search and gather details on the first hits.

        The parsed topics are also written to disk through ``save``.

        Returns:
            A pair ``(topics, infos)``: the output of ``parse`` on the
            results page and the output of ``getInfos`` on those topics.

        Raises:
            ConnectionError: when the page carries the "not permitted"
                notice (login did not work) or when the status code is
                not 200.
        """
        if self.debug:
            print("Going to search page and check connection...", end = " ")
        reponse = session.get(f"{self.url}/search.php", params = {"keywords": self.requested_app, "sr": "topics", "sf": "titleonly"})

        if "Sorry but you are not permitted to use the search system. If you're not logged in please" in reponse.text:
            raise ConnectionError(self.errorFormat(message = "Connection failed, check credentials"))
        if reponse.status_code != 200:
            raise ConnectionError(self.errorFormat(code = reponse.status_code, message = "Impossible to make the search"))

        if self.debug:
            print("Connected.")
        if self.debug:
            print(f"Fetching results for {self.requested_app}...", end = " ")

        topics = self.parse(reponse.text)
        self.save(topics)
        return topics, self.getInfos(session, topics)

    def parse(self, htmlPage: str) -> list[dict]:
        """Turn the HTML of a search results page into a list of topic dicts.

        Each dict has the keys ``title``, ``author``, ``date``, ``link`` and
        ``linkParams`` (a ``{"f": ..., "t": ...}`` dict usable as query
        parameters). Any field that cannot be extracted is ``None``; in
        particular ``link`` and ``linkParams`` are both ``None`` when no
        topic URL is found, instead of raising.

        Returns:
            An empty list when the page reports no match or contains no
            result row, otherwise one dict per result row.
        """
        if "No suitable matches were found." in htmlPage:
            return []

        # Every result row starts with this marker; what precedes the first
        # one is page header.
        elements = htmlPage.split("<tr>\n<td>")[1:]
        if not elements:
            return []
        # Cut the page footer off the last row.
        elements[-1] = elements[-1].split("</td>\n</tr>")[0]

        for i, rawRow in enumerate(elements):
            titles = findall(r"class=\"topictitle\">(.*)<\/a>", rawRow)
            _title = sub(r" ?&amp; ?", " ", titles[0]) if titles else None

            authors = findall(r"(<br />|</strong>)\n\n?<i class=\"icon-user\"></i> by <a href=\"\./memberlist\.php\?mode=viewprofile&amp;u=\d+\"( style=\"color: #.*;\" class=\"username-coloured\")?>(.*)</a>", rawRow)
            # findall yields one tuple per match; the user name is the last group.
            _author = authors[0][-1] if authors else None

            links = findall(r"\./viewtopic\.php\?f=(\d*)&amp;t=(\d*)&amp", rawRow)
            _link = {"f": links[0][0], "t": links[0][1]} if links else None

            dates = findall(r"</a> <i class=\"icon-time\"></i> <small>(.*)</small>", rawRow)
            _date = dates[0] if dates else None

            # Raw HTML dump, only useful when debugging the regexes.
            if self.debug:
                print("\n" + rawRow + "\n")

            if _link is None:
                _url = None
            else:
                _url = f"{self.url}/viewtopic.php?f={_link['f']}&t={_link['t']}"
            elements[i] = {"title": _title, "author": _author, "date": _date, "link": _url, "linkParams": _link}
        return elements

    def getInfos(self, session: "CloudScraper", elements: list) -> list:
        """Fetch the topic pages of the first results and parse them.

        Only the first three entries of ``elements`` are requested, using
        each entry's ``linkParams`` as query parameters.

        Returns:
            An empty list when ``elements`` is empty, otherwise the output
            of ``parsingInfos`` on the fetched pages.

        Raises:
            ConnectionError: when one of the topic pages does not answer 200.
        """
        size = len(elements)
        if size == 0:
            return []

        page = 3
        if self.debug:
            print(f"Going to the {page} first pages...", end = " ")

        results = []
        for i, topic in enumerate(elements[:page]):
            reponse = session.get(f"{self.url}/viewtopic.php", params = topic["linkParams"])
            results.append(reponse)
            if reponse.status_code != 200:
                raise ConnectionError(self.errorFormat(code = reponse.status_code, message = f"Error while doing the search n°{i}"))

        if self.debug:
            print("Done.")
        if self.debug:
            print("Parsing results page...", end = " ")
        results = self.parsingInfos(results)
        if self.debug:
            print("Done.")
        return results

    def parsingInfos(self, elements: list) -> list[dict]:
        """Extract the changelog and the download links from topic pages.

        ``elements`` is a list of objects exposing the page HTML as
        ``.text``. The list is rewritten in place: each entry becomes a dict
        with the keys ``changelogs`` and ``downloadLinks``, and the same
        list is returned.

        * A page without "Download Instructions" gives ``None`` for both keys.
        * A missing changelog gives the text "No changelog found.".
        * Download links that cannot be located give ``None`` instead of
          raising while cleaning them up.
        """
        for i, page in enumerate(elements):
            html = page.text
            if "Download Instructions" not in html:
                elements[i] = {"changelogs": None, "downloadLinks": None}
                continue

            try:
                _changelogs = findall(r"What's New:</span> ?<br />(.*)<br /><br /><span style=\"c|font-weight: bold\">T", html)[0]
                if len(_changelogs) < 2: # nothing captured, try the other layout
                    _changelogs = findall(r"What's New:</span> ?<br />(.*)<br /><br /><span style=\"font-weight: bold\">T", html)[0]
            except IndexError: # no match at all
                _changelogs = "No changelog found."

            # Drop whatever sits between the heading and the first "<br /><s".
            html = sub(r"Download Instructions:</span>(.*)?<br /><s", "Download Instructions:</span><br /><s", html)
            try:
                _downloadLinks = findall(r"Download Instructions:</span> ?<br />(.*|[\s\S]*)<br /><br />Trouble downloading|</a></div>", html)[0]
                if len(_downloadLinks) < 2: # nothing captured, try the other layout
                    _downloadLinks = findall(r"Download Instructions:</span> ?<br />(.*|[\s\S]*)</a></div>", html)[0]
            except IndexError: # no match at all
                _downloadLinks = None

            # The clean-up only makes sense on text; sub() rejects None.
            if _downloadLinks is not None:
                _downloadLinks = sub(r"\n|<a class=\"postlink\" href=\"|\(Closed Filehost\) ?|<span style=\"font-weight: bold\">|</span>|\">(\S*)</a>", "", _downloadLinks) # remove html garbage
                _downloadLinks = sub(r"<br />\n?", "\n", _downloadLinks) # convert newline html to \n
                _downloadLinks = sub(r"Mirrors(?!:)|Mirror(?!s)(?!:)", "Mirror:", _downloadLinks) # add ":"
                _downloadLinks = _downloadLinks.split('">')[0]

            elements[i] = {"changelogs": _changelogs, "downloadLinks": _downloadLinks}
        return elements

    def prettyPrint(self, topics: tuple[list[dict], list[dict]]) -> list:
        """Print a readable summary of each detailed topic and return the data.

        ``topics`` is the ``(topics, infos)`` pair returned by ``search``.
        One entry is produced per item of ``infos``, merged with the topic
        found at the same index.

        Returns:
            An empty list when there is no topic, otherwise a list of dicts
            with the keys ``title``, ``author``, ``date``, ``changelogs``
            and ``downloadLinks``.
        """
        topicList, topicsInfos = topics
        if len(topicList) == 0:
            return []

        print("\n")
        result = []
        for i, infos in enumerate(topicsInfos):
            entry = {
                "title": topicList[i]["title"],
                "author": topicList[i]["author"],
                "date": topicList[i]["date"],
                # HTML line breaks become real newlines for display
                "changelogs": str(infos["changelogs"]).replace("<br />", "\n"),
                "downloadLinks": infos["downloadLinks"]
            }
            result.append(entry)
            print(f"Title: {entry['title']}\n")
            print(f"Author: {entry['author']}\n")
            print(f"Date of release: {entry['date']}\n")
            print(f"Changelogs: \n{entry['changelogs']}\n")
            print(f"Download links: \n{entry['downloadLinks']}")
            print("\n\n---\n")
        return result

    def work(self) -> list:
        """Run the whole pipeline: connect, search, then print the results."""
        return self.prettyPrint(self.search(self.connect()))

    def save(self, elements: list) -> None:
        """Write the parsed topics to ``results.csv`` in the current directory.

        The file is ``;``-separated and UTF-8 encoded. Its header is made of
        the keys of the first element minus ``linkParams``, and every row
        holds the matching values converted with ``str``. Values containing
        the separator or a quote are quoted by the ``csv`` module so the
        columns stay aligned.

        Nothing is written when ``elements`` is empty; a message is printed
        in both cases.
        """
        import csv # local import so the class does not depend on the file header

        size = len(elements)
        if size == 0:
            print("No elements were found with the search.")
            return

        filename = "results.csv"
        # linkParams is a dict of query parameters, not meant for the CSV
        header = [key for key in elements[0] if key != "linkParams"]
        # newline="" lets the csv module control line endings itself
        with open(filename, "w", encoding = "utf-8", newline = "") as f:
            writer = csv.writer(f, delimiter = ";", lineterminator = "\n")
            writer.writerow(header)
            writer.writerows([str(element.get(key)) for key in header] for element in elements)
        print(f"{size} elements have been registered in the {filename} file.")
def _debugEnabled(env) -> bool:
    """Tell whether DEBUG_MOBILISM holds "yes", "true" or "1" (any case)."""
    return env.get("DEBUG_MOBILISM", "").lower() in ("yes", "true", "1")


def _resolveCredentials(args: list, env) -> tuple:
    """Work out the credentials and the words of the application name.

    The environment mapping is tried first (``PSEUDO_MOBILISM`` and
    ``PASSWORD_MOBILISM``); in that case every argument belongs to the
    application name. Otherwise the first two arguments are the pseudo and
    the password and the remaining ones form the application name.

    Returns:
        A ``(pseudo, password, appWords)`` tuple.

    Raises:
        KeyError: when the environment has no credentials and fewer than
            three arguments were given.
    """
    try:
        return env["PSEUDO_MOBILISM"], env["PASSWORD_MOBILISM"], args
    except KeyError:
        pass # fall back to the command line
    if len(args) < 3:
        raise KeyError("missing credentials or application name")
    # Drop the two credential arguments, keep everything after them.
    return args[0], args[1], args[2:]


if __name__ == "__main__":
    args = argv[1:]
    if len(args) < 1: # no args
        print("No App to retrieve.")
        raise SystemExit(1)
    load_dotenv() # load .env file
    try:
        pseudoMobilism, passwordMobilism, appWords = _resolveCredentials(args, environ)
    except KeyError:
        print('Please fill in the username and password (with quotes) by args or with .env file and give an app to retrieve.')
    else:
        Scraper(pseudoMobilism, passwordMobilism, " ".join(appWords), _debugEnabled(environ)).work() # call the work() function