pusk/bin/main.ml

88 lines
2.7 KiB
OCaml
Raw Normal View History

2023-05-12 10:51:39 +02:00
open Lwt.Syntax
open Cohttp_lwt
open Cohttp_lwt_unix
let fmt = Printf.sprintf
2023-05-12 18:40:47 +02:00
let rec download uri dest =
2023-05-12 10:51:39 +02:00
let* response, body = Client.get uri in
let status = Response.status response in
2023-05-12 18:40:47 +02:00
let code = Cohttp.Code.code_of_status status in
if Cohttp.Code.is_redirection code
2023-05-12 10:51:39 +02:00
then (
2023-05-12 18:40:47 +02:00
let headers = Response.headers response in
match Cohttp.Header.get headers "location" with
| Some url ->
let uri = Uri.of_string url in
let redirect_url = Uri.resolve "" uri uri in
download redirect_url dest
| None -> Lwt.fail_with "Redirect location not found")
else if Cohttp.Code.is_success code
then (
print_endline "Downloading...";
2023-05-12 10:51:39 +02:00
let stream = Body.to_stream body in
2023-05-12 18:40:47 +02:00
let res =
Lwt_io.with_file ~mode:Lwt_io.output dest (fun chan ->
Lwt_stream.iter_s (Lwt_io.write chan) stream)
in
let* () = res in
print_endline "Download done!";
Lwt.return_unit)
2023-05-12 10:51:39 +02:00
else
Lwt.fail_with
("Failed to download file. HTTP status: " ^ Cohttp.Code.string_of_status status)
;;
let download_selenium version =
let url =
format_of_string
"https://github.com/SeleniumHQ/selenium/releases/download/selenium-%s/selenium-server-%s.jar"
in
download (Uri.of_string (fmt url version version)) (fmt "./selenium-%s.jar" version)
;;
2023-05-12 19:36:27 +02:00
let download_gecko_driver version output =
let url =
format_of_string
"https://github.com/mozilla/geckodriver/releases/download/v%s/geckodriver-v%s-linux64.tar.gz"
in
download (Uri.of_string (fmt url version version)) output
;;
let run_program_in_background program args =
let pid = Unix.fork () in
match pid with
| 0 ->
(* Child process *)
let dev_null = Unix.openfile "/dev/null" [ O_WRONLY ] 0o666 in
Unix.dup2 dev_null Unix.stdout;
Unix.dup2 dev_null Unix.stderr;
Unix.close dev_null;
Unix.execvp program (Array.of_list (program :: args))
| _ -> pid (* Parent process *)
;;
let () =
(* Selenium *)
let version_selenium = "4.9.0" in
let selenium = fmt "selenium-%s.jar" version_selenium in
if not (Sys.file_exists selenium) then Lwt_main.run (download_selenium version_selenium);
(* Gecko Driver *)
let driver = fmt "geckodriver" in
if not (Sys.file_exists driver)
then (
let version_driver = "0.33.0" in
let archive = fmt "./gecko-%s.tar.gz" version_driver in
Lwt_main.run (download_gecko_driver version_driver archive);
let _ = Sys.command (fmt "tar xvzf %s" archive) in
());
let selenium_pid =
run_program_in_background "java" [ fmt "-jar %s" selenium; "standalone" ]
in
print_endline (fmt "Java running in %d" selenium_pid);
let closed_pid, _ = Unix.waitpid [] selenium_pid in
if not (closed_pid = selenium_pid)
then print_endline "WTF???"
else print_endline (fmt "Program %d closed!" closed_pid)
;;