2022-08-16 14:05:25 +02:00
|
|
|
use chrono::{Datelike, Duration, TimeZone, Utc};
|
2022-08-16 10:41:42 +02:00
|
|
|
use regex::Regex;
|
2022-08-16 11:57:36 +02:00
|
|
|
use scraper::{Html, Selector};
|
2022-08-16 10:41:42 +02:00
|
|
|
|
2022-08-15 19:20:04 +02:00
|
|
|
pub mod models;
|
2022-08-15 12:18:08 +02:00
|
|
|
|
2022-08-15 17:25:14 +02:00
|
|
|
/// Fetch the timetable for a class
|
2022-08-15 20:09:41 +02:00
|
|
|
pub async fn timetable(
|
|
|
|
year: i8,
|
|
|
|
semester: i8,
|
|
|
|
letter: Option<char>,
|
2022-08-16 09:33:35 +02:00
|
|
|
) -> (Vec<String>, (usize, Vec<models::Day>)) {
|
2022-08-15 14:52:57 +02:00
|
|
|
let document = get_webpage(year, semester, letter)
|
|
|
|
.await
|
|
|
|
.expect("Can't reach timetable website.");
|
2022-08-15 12:18:08 +02:00
|
|
|
|
|
|
|
// Selectors
|
|
|
|
let sel_table = Selector::parse("table").unwrap();
|
|
|
|
let sel_tr = Selector::parse("tr").unwrap();
|
|
|
|
let sel_tbody = Selector::parse("tbody").unwrap();
|
|
|
|
let sel_th = Selector::parse("th").unwrap();
|
|
|
|
let sel_td = Selector::parse("td").unwrap();
|
|
|
|
let sel_em = Selector::parse("em").unwrap();
|
|
|
|
let sel_small = Selector::parse("small").unwrap();
|
|
|
|
let sel_strong = Selector::parse("strong").unwrap();
|
|
|
|
|
|
|
|
// Find the timetable
|
2022-08-15 12:23:01 +02:00
|
|
|
let raw_timetable = document.select(&sel_table).next().unwrap();
|
2022-08-15 12:18:08 +02:00
|
|
|
|
|
|
|
// Find the slots available for the timetable
|
|
|
|
let raw_schedules = raw_timetable.select(&sel_tr).next().unwrap();
|
|
|
|
|
|
|
|
// Find availables schedules
|
|
|
|
let mut schedules = Vec::new();
|
|
|
|
for time in raw_schedules.select(&sel_th) {
|
|
|
|
schedules.push(time.inner_html());
|
|
|
|
}
|
|
|
|
|
|
|
|
// Find the timetable values
|
|
|
|
let raw_timetable_values = raw_timetable.select(&sel_tbody).next().unwrap();
|
|
|
|
|
|
|
|
// For each days
|
|
|
|
let mut timetable = Vec::new();
|
|
|
|
for day in raw_timetable_values.select(&sel_tr) {
|
|
|
|
let mut courses_vec = Vec::new();
|
|
|
|
let mut location_tracker = 0;
|
|
|
|
for course in day.select(&sel_td) {
|
|
|
|
if course.inner_html() == "—" {
|
|
|
|
courses_vec.push(None);
|
|
|
|
location_tracker += 1;
|
|
|
|
} else {
|
|
|
|
courses_vec.push(Some(models::Course {
|
|
|
|
name: course.select(&sel_em).next().unwrap().inner_html(),
|
|
|
|
professor: match course
|
|
|
|
.select(&sel_small)
|
|
|
|
.next()
|
|
|
|
.unwrap()
|
|
|
|
.inner_html()
|
|
|
|
.split("<br>")
|
|
|
|
.next()
|
|
|
|
{
|
|
|
|
Some(data) => {
|
|
|
|
if data.contains("</strong>") {
|
|
|
|
// This is the room, so there is no professor assigned
|
|
|
|
// to this courses yet
|
|
|
|
None
|
|
|
|
} else {
|
|
|
|
Some(data.to_string())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None => None,
|
|
|
|
},
|
|
|
|
room: course
|
|
|
|
.select(&sel_strong)
|
|
|
|
.next()
|
|
|
|
.unwrap()
|
|
|
|
.inner_html()
|
|
|
|
.replace("<br>", ""),
|
|
|
|
start: location_tracker,
|
|
|
|
size: match course.value().attr("colspan") {
|
|
|
|
Some(i) => i.parse().unwrap(),
|
|
|
|
None => 1,
|
|
|
|
},
|
2022-08-16 11:57:36 +02:00
|
|
|
dtstart: None,
|
|
|
|
dtend: None,
|
2022-08-15 12:18:08 +02:00
|
|
|
}));
|
|
|
|
|
|
|
|
match &courses_vec[courses_vec.len() - 1] {
|
|
|
|
Some(course) => location_tracker += course.size,
|
|
|
|
None => location_tracker += 1,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
timetable.push(models::Day {
|
|
|
|
name: day.select(&sel_th).next().unwrap().inner_html(),
|
|
|
|
courses: courses_vec,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
if !check_consistency(&schedules, &timetable) {
|
|
|
|
panic!("Error when building the timetable.");
|
|
|
|
}
|
|
|
|
|
2022-08-16 09:33:35 +02:00
|
|
|
(schedules, (semester as usize, timetable))
|
2022-08-15 12:18:08 +02:00
|
|
|
}
|
|
|
|
|
2022-08-15 17:25:14 +02:00
|
|
|
/// Get timetable webpage
|
2022-08-15 12:18:08 +02:00
|
|
|
async fn get_webpage(
|
|
|
|
year: i8,
|
|
|
|
semester: i8,
|
|
|
|
letter: Option<char>,
|
|
|
|
) -> Result<Html, Box<dyn std::error::Error>> {
|
|
|
|
/* let url = {
|
|
|
|
let panic_semester_message = "Unknown semester.";
|
|
|
|
let panic_letter_message = "Unknown letter.";
|
|
|
|
|
|
|
|
let base_url = "https://informatique.up8.edu/licence-iv/edt";
|
|
|
|
match year {
|
|
|
|
1 => {
|
|
|
|
let allow_letters = match semester {
|
|
|
|
1 => ['a', 'b', 'c'],
|
|
|
|
2 => ['x', 'y', 'z'],
|
|
|
|
_ => panic!("{}", panic_semester_message),
|
|
|
|
};
|
|
|
|
let c = letter.expect(panic_letter_message);
|
|
|
|
if allow_letters.contains(&c) {
|
|
|
|
format!("{}/l1-{}.html", base_url, c)
|
|
|
|
} else {
|
|
|
|
panic!("{}", panic_letter_message)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
2 => {
|
|
|
|
let allow_letters = match semester {
|
|
|
|
1 => ['a', 'b'],
|
|
|
|
2 => ['x', 'y'],
|
|
|
|
_ => panic!("{}", panic_semester_message),
|
|
|
|
};
|
|
|
|
let c = letter.expect(panic_letter_message);
|
|
|
|
if allow_letters.contains(&c) {
|
|
|
|
format!("{}/l2-{}.html", base_url, c)
|
|
|
|
} else {
|
|
|
|
panic!("{}", panic_letter_message)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
3 => match semester {
|
|
|
|
1 => format!("{}/l3.html", base_url),
|
|
|
|
2 => format!("{}/l3_2.html", base_url),
|
|
|
|
_ => panic!("{}", panic_semester_message),
|
|
|
|
},
|
|
|
|
_ => panic!("Unknown year."),
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
// Get raw html
|
|
|
|
let html = reqwest::get(url).await?.text().await?;
|
|
|
|
|
|
|
|
// Parse document
|
|
|
|
let document = Html::parse_document(&html); */
|
|
|
|
|
|
|
|
println!("Fetch 'L{}{} (s{})'", year, letter.unwrap_or(' '), semester);
|
|
|
|
let html = include_str!("../target/debug.html");
|
|
|
|
let document = Html::parse_document(html);
|
|
|
|
|
|
|
|
Ok(document)
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Check if the timetable is well built
|
|
|
|
fn check_consistency(schedules: &Vec<String>, timetable: &Vec<models::Day>) -> bool {
|
|
|
|
let mut checker = true;
|
|
|
|
for day in timetable {
|
|
|
|
let mut i = 0;
|
|
|
|
for course in &day.courses {
|
|
|
|
match course {
|
|
|
|
Some(course_it) => {
|
|
|
|
// Checks the consistency of course start times
|
|
|
|
if i != course_it.start {
|
|
|
|
checker = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
// Keep the track of how many courses are in the day
|
|
|
|
i += course_it.size
|
|
|
|
}
|
|
|
|
None => i += 1,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// The counter should be the same as the amount of possible hours of the day
|
|
|
|
if i != schedules.len() {
|
|
|
|
checker = false;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
checker
|
|
|
|
}
|
2022-08-16 10:41:42 +02:00
|
|
|
|
2022-08-16 11:57:36 +02:00
|
|
|
// Data builded in the timetable webpage
|
2022-08-16 10:41:42 +02:00
|
|
|
type T = (
|
|
|
|
// Schedules
|
|
|
|
Vec<String>,
|
|
|
|
// Timetable per days with the semester as the key
|
2022-08-16 11:57:36 +02:00
|
|
|
(usize, Vec<models::Day>),
|
2022-08-16 10:41:42 +02:00
|
|
|
);
|
2022-08-16 11:57:36 +02:00
|
|
|
// Data builded in the info webpage
|
2022-08-16 10:41:42 +02:00
|
|
|
type D = std::collections::HashMap<
|
2022-08-16 11:57:36 +02:00
|
|
|
// Semester
|
2022-08-16 10:41:42 +02:00
|
|
|
usize,
|
2022-08-16 14:41:51 +02:00
|
|
|
// List of start and repetition of course weeks
|
|
|
|
Vec<(chrono::DateTime<Utc>, i64)>,
|
2022-08-16 10:41:42 +02:00
|
|
|
>;
|
|
|
|
|
|
|
|
/// Build the timetable
|
2022-08-16 11:57:36 +02:00
|
|
|
pub fn build(timetable: T, dates: D) -> Vec<models::Course> {
|
2022-08-16 10:41:42 +02:00
|
|
|
let mut schedules = Vec::new();
|
|
|
|
// h1 => heure de début | m1 => minute de début
|
|
|
|
// h2 => heure de fin | m2 => minute de fin
|
|
|
|
let re =
|
|
|
|
Regex::new(r"(?P<h1>\d{1,2})h(?P<m1>\d{1,2})?.(?P<h2>\d{1,2})h(?P<m2>\d{1,2})?").unwrap();
|
|
|
|
for hour in timetable.0 {
|
|
|
|
let captures = re.captures(&hour).unwrap();
|
|
|
|
|
|
|
|
let h1 = match captures.name("h1") {
|
|
|
|
Some(h) => h.as_str().parse().unwrap(),
|
|
|
|
None => 0,
|
|
|
|
};
|
|
|
|
let m1 = match captures.name("m1") {
|
|
|
|
Some(h) => h.as_str().parse().unwrap(),
|
|
|
|
None => 0,
|
|
|
|
};
|
|
|
|
let h2 = match captures.name("h2") {
|
|
|
|
Some(h) => h.as_str().parse().unwrap(),
|
|
|
|
None => 0,
|
|
|
|
};
|
|
|
|
let m2 = match captures.name("m2") {
|
|
|
|
Some(h) => h.as_str().parse().unwrap(),
|
|
|
|
None => 0,
|
|
|
|
};
|
|
|
|
schedules.push(((h1, m1), (h2, m2)));
|
|
|
|
}
|
|
|
|
|
2022-08-16 14:05:25 +02:00
|
|
|
// Store all the courses for the semester
|
|
|
|
let mut semester = Vec::new();
|
2022-08-16 10:41:42 +02:00
|
|
|
|
2022-08-16 14:05:25 +02:00
|
|
|
// Start date of the back-to-school week
|
2022-08-16 14:41:51 +02:00
|
|
|
let data = dates.get(&timetable.1 .0).unwrap().get(0).unwrap();
|
|
|
|
let mut date = data.0;
|
|
|
|
// For each weeks
|
|
|
|
for _ in 0..(data.1) {
|
|
|
|
for day in &timetable.1 .1 {
|
|
|
|
for mut course in day.courses.clone().into_iter().flatten() {
|
|
|
|
// Get the hours
|
|
|
|
let start = schedules.get(course.start).unwrap().0;
|
|
|
|
// -1 because we only add when the size is > 1
|
|
|
|
let end = schedules.get(course.start + course.size - 1).unwrap().1;
|
2022-08-16 10:41:42 +02:00
|
|
|
|
2022-08-16 14:41:51 +02:00
|
|
|
// Add the changed datetimes
|
|
|
|
course.dtstart = Some(
|
|
|
|
Utc.ymd(date.year(), date.month(), date.day())
|
|
|
|
.and_hms(start.0, start.1, 0),
|
|
|
|
);
|
|
|
|
course.dtend = Some(
|
|
|
|
Utc.ymd(date.year(), date.month(), date.day())
|
|
|
|
.and_hms(end.0, end.1, 0),
|
|
|
|
);
|
2022-08-16 10:41:42 +02:00
|
|
|
|
2022-08-16 14:41:51 +02:00
|
|
|
semester.push(course);
|
|
|
|
}
|
|
|
|
date += Duration::days(1);
|
2022-08-16 14:05:25 +02:00
|
|
|
}
|
2022-08-16 14:41:51 +02:00
|
|
|
// From friday to monday
|
|
|
|
date += Duration::days(2);
|
2022-08-16 14:05:25 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
semester
|
2022-08-16 10:41:42 +02:00
|
|
|
}
|