mirror of
https://github.com/quatalog/quatalog.git
synced 2024-11-21 14:23:02 +00:00
Begin rewriting in C++
This commit is contained in:
commit
bd8f2dd43b
3
.gitmodules
vendored
Normal file
3
.gitmodules
vendored
Normal file
|
@ -0,0 +1,3 @@
|
|||
[submodule "3rdparty/jsoncpp"]
|
||||
path = 3rdparty/jsoncpp
|
||||
url = https://github.com/open-source-parsers/jsoncpp
|
1
3rdparty/jsoncpp
vendored
Submodule
1
3rdparty/jsoncpp
vendored
Submodule
|
@ -0,0 +1 @@
|
|||
Subproject commit 8190e061bc2d95da37479a638aa2c9e483e58ec6
|
131
CourseOfferingsScraper.cpp
Normal file
131
CourseOfferingsScraper.cpp
Normal file
|
@ -0,0 +1,131 @@
|
|||
#include<set>
|
||||
#include<regex>
|
||||
#include<fstream>
|
||||
#include<iostream>
|
||||
#include<filesystem>
|
||||
#include<dist/jsoncpp.cpp>
|
||||
|
||||
namespace fs = std::filesystem;
|
||||
void handle_term(const fs::directory_entry&,Json::Value&);
|
||||
void handle_course(const Json::Value&,const std::string&,Json::Value&);
|
||||
void handle_attribute(Json::Value&,const std::string&);
|
||||
|
||||
int main(const int argc,const char** argv) {
|
||||
if(argc < 2) {
|
||||
std::cerr << "Bad number of arguments " << argc << std::endl;
|
||||
return EXIT_FAILURE;
|
||||
}
|
||||
|
||||
const auto data_dir_path = fs::path(argv[1]);
|
||||
|
||||
if(!fs::is_directory(data_dir_path)) {
|
||||
std::cerr << "Data dir argument " << data_dir_path << " is not a directory" << std::endl;
|
||||
return EXIT_FAILURE;
|
||||
}
|
||||
|
||||
const auto data_dir = fs::directory_iterator(data_dir_path);
|
||||
|
||||
std::set<fs::directory_entry> term_dirs;
|
||||
for(const fs::directory_entry term : data_dir) {
|
||||
term_dirs.insert(term);
|
||||
}
|
||||
|
||||
Json::Value terms_offered;
|
||||
terms_offered["all_terms"] = Json::arrayValue;
|
||||
for(auto term : term_dirs) {
|
||||
if(!fs::is_directory(term)) {
|
||||
continue;
|
||||
}
|
||||
|
||||
handle_term(term,terms_offered);
|
||||
}
|
||||
|
||||
//std::cout << terms_offered["all_terms"] << std::endl;
|
||||
//std::cout << terms_offered["MATH-4020"] << std::endl;
|
||||
std::cout << terms_offered << std::endl;
|
||||
|
||||
return EXIT_SUCCESS;
|
||||
}
|
||||
|
||||
void handle_term(const fs::directory_entry& term_entry,
|
||||
Json::Value& terms_offered) {
|
||||
const fs::path dir = term_entry.path();
|
||||
const auto dirname = dir.string();
|
||||
const auto term = dir.stem().string();
|
||||
const auto courses_filename = dirname + "/courses.json";
|
||||
const auto prereqs_filename = dirname + "/prerequisites.json";
|
||||
std::fstream courses_file{courses_filename,std::ios::in};
|
||||
std::fstream prereqs_file{prereqs_filename,std::ios::in};
|
||||
|
||||
#ifdef DEBUG
|
||||
std::cerr << '\t' << courses_filename << std::endl;
|
||||
std::cerr << '\t' << prereqs_filename << std::endl;
|
||||
std::cerr << "Processing term " << term << "..." << std::endl;
|
||||
#endif
|
||||
terms_offered["all_terms"].append(term);
|
||||
|
||||
Json::Value courses;
|
||||
courses_file >> courses;
|
||||
for(auto prefix : courses) {
|
||||
#ifdef DEBUG
|
||||
std::cerr << "\tProcessing prefix "
|
||||
<< prefix["code"]
|
||||
<< " - "
|
||||
<< prefix["name"]
|
||||
<< "..."
|
||||
<< std::endl;
|
||||
#endif
|
||||
for(auto course : prefix["courses"]) {
|
||||
handle_course(course,term,terms_offered);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
void handle_course(const Json::Value& course,const std::string& term,Json::Value& terms_offered) {
|
||||
const auto course_code = course["id"].asString();
|
||||
auto& course_term = terms_offered[course_code][term];
|
||||
course_term["title"] = course["title"];
|
||||
|
||||
int credMin = Json::Value::maxInt;
|
||||
int credMax = 0;
|
||||
for(auto section : course["sections"]) {
|
||||
credMin = std::min(credMin,section["credMin"].asInt());
|
||||
credMax = std::max(credMax,section["credMax"].asInt());
|
||||
}
|
||||
course_term["credMin"] = credMin;
|
||||
course_term["credMax"] = credMax;
|
||||
|
||||
const auto section = course["sections"][0];
|
||||
|
||||
const auto delim = std::regex(" and |, ");
|
||||
const auto attributes_str = section["attribute"].asString();
|
||||
const auto end_itr = std::sregex_token_iterator();
|
||||
|
||||
auto attributes_itr = std::sregex_token_iterator(
|
||||
attributes_str.begin(),
|
||||
attributes_str.end(),
|
||||
delim,-1);
|
||||
while(attributes_itr != end_itr
|
||||
&& !attributes_itr->str().empty()) {
|
||||
handle_attribute(course_term,attributes_itr->str());
|
||||
attributes_itr++;
|
||||
}
|
||||
}
|
||||
|
||||
void handle_attribute(Json::Value& course_term,const std::string& attribute) {
|
||||
std::string attr;
|
||||
if(attribute == "Communication Intensive") {
|
||||
attr = "[CI]";
|
||||
} else if(attribute == "Writing Intensive") {
|
||||
attr = "[WI]";
|
||||
} else if(attribute == "HASS Inquiry") {
|
||||
attr = "[HInq]";
|
||||
} else if(attribute == "Culminating Exp/Capstone") {
|
||||
attr = "[CulmExp]";
|
||||
} else if(attribute == "PDII Option for Engr Majors") {
|
||||
attr = "[PDII]";
|
||||
}
|
||||
if(!attr.empty()) {
|
||||
course_term["attributes"].append(attr);
|
||||
}
|
||||
}
|
Loading…
Reference in a new issue