├── .gitignore ├── README.md ├── combined_ranking_cs_2023.tsv ├── combined_ranking_math_2023.tsv ├── normalize.py ├── scraper ├── data_scraped │ ├── arwu.jsonl │ ├── arwu_math_2023.jsonl │ ├── qs.jsonl │ ├── qs_math_2023.jsonl │ ├── the.jsonl │ └── the_math_2023.jsonl ├── scraper │ ├── __init__.py │ ├── items.py │ ├── middlewares.py │ ├── pipelines.py │ ├── settings.py │ └── spiders │ │ ├── __init__.py │ │ ├── arwu.py │ │ ├── qs.py │ │ └── the.py └── scrapy.cfg ├── top-10-universities-cs-2023.png ├── top-10-universities-math-2023.png └── top_unis.ipynb /.gitignore: -------------------------------------------------------------------------------- 1 | .ipynb_checkpoints/ 2 | __pycache__/ 3 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/README.md -------------------------------------------------------------------------------- /combined_ranking_cs_2023.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/combined_ranking_cs_2023.tsv -------------------------------------------------------------------------------- /combined_ranking_math_2023.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/combined_ranking_math_2023.tsv -------------------------------------------------------------------------------- /normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/normalize.py -------------------------------------------------------------------------------- /scraper/data_scraped/arwu.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/arwu.jsonl -------------------------------------------------------------------------------- /scraper/data_scraped/arwu_math_2023.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/arwu_math_2023.jsonl -------------------------------------------------------------------------------- /scraper/data_scraped/qs.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/qs.jsonl -------------------------------------------------------------------------------- /scraper/data_scraped/qs_math_2023.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/qs_math_2023.jsonl -------------------------------------------------------------------------------- /scraper/data_scraped/the.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/the.jsonl -------------------------------------------------------------------------------- /scraper/data_scraped/the_math_2023.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/data_scraped/the_math_2023.jsonl -------------------------------------------------------------------------------- /scraper/scraper/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scraper/scraper/items.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/items.py -------------------------------------------------------------------------------- /scraper/scraper/middlewares.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/middlewares.py -------------------------------------------------------------------------------- /scraper/scraper/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/pipelines.py -------------------------------------------------------------------------------- /scraper/scraper/settings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/settings.py -------------------------------------------------------------------------------- /scraper/scraper/spiders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/spiders/__init__.py -------------------------------------------------------------------------------- /scraper/scraper/spiders/arwu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/spiders/arwu.py -------------------------------------------------------------------------------- /scraper/scraper/spiders/qs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/spiders/qs.py -------------------------------------------------------------------------------- /scraper/scraper/spiders/the.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scraper/spiders/the.py -------------------------------------------------------------------------------- /scraper/scrapy.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/scraper/scrapy.cfg -------------------------------------------------------------------------------- /top-10-universities-cs-2023.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/top-10-universities-cs-2023.png -------------------------------------------------------------------------------- /top-10-universities-math-2023.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/top-10-universities-math-2023.png -------------------------------------------------------------------------------- /top_unis.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/manocormen/top-universities/HEAD/top_unis.ipynb --------------------------------------------------------------------------------