├── .gitignore ├── CODEOWNERS ├── LICENSE.md ├── README.md ├── assets └── test_subsample_indices │ ├── arxiv │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── bibliotik │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── commoncrawl │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── dm-mathematics │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── enron │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── europarl │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── freelaw │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── github │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── gutenberg │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── hackernews │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── nih-exporter │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── opensubtitles │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── openwebtext2 │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── pubmed-abstracts │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── pubmed-central │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── stackexchange │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── uspto │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ ├── wikipedia │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json │ └── youtubesubtitles │ ├── group0.json │ ├── group1.json │ ├── group2.json │ ├── group3.json │ ├── group4.json │ ├── group5.json │ ├── group6.json │ ├── group7.json │ ├── group8.json │ └── group9.json ├── lm_perplexity ├── __init__.py ├── compute_perplexity.py ├── models.py ├── save_lm_perplexity_data.py └── utils.py ├── preset_configs ├── gpt2_large.json ├── gpt2_medium.json ├── gpt2_small.json ├── gpt2_xl.json ├── gpt3_ada.json ├── gpt3_babbage.json ├── gpt3_curie.json └── gpt3_davinci.json ├── scripts └── export_test_splits.py └── tests ├── __init__.py └── test_utils.py /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | pip-wheel-metadata/ 24 | share/python-wheels/ 25 | *.egg-info/ 26 | .installed.cfg 27 | *.egg 28 | MANIFEST 29 | 30 | # PyInstaller 31 | # Usually these files are written by a python script from a template 32 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 33 | *.manifest 34 | *.spec 35 | 36 | # Installer logs 37 | pip-log.txt 38 | pip-delete-this-directory.txt 39 | 40 | # Unit test / coverage reports 41 | htmlcov/ 42 | .tox/ 43 | .nox/ 44 | .coverage 45 | .coverage.* 46 | .cache 47 | nosetests.xml 48 | coverage.xml 49 | *.cover 50 | *.py,cover 51 | .hypothesis/ 52 | .pytest_cache/ 53 | 54 | # Translations 55 | *.mo 56 | *.pot 57 | 58 | # Django stuff: 59 | *.log 60 | local_settings.py 61 | db.sqlite3 62 | db.sqlite3-journal 63 | 64 | # Flask stuff: 65 | instance/ 66 | .webassets-cache 67 | 68 | # Scrapy stuff: 69 | .scrapy 70 | 71 | # Sphinx documentation 72 | docs/_build/ 73 | 74 | # PyBuilder 75 | target/ 76 | 77 | # Jupyter Notebook 78 | .ipynb_checkpoints 79 | 80 | # IPython 81 | profile_default/ 82 | ipython_config.py 83 | 84 | # pyenv 85 | .python-version 86 | 87 | # pipenv 88 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 89 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 90 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 91 | # install all needed dependencies. 92 | #Pipfile.lock 93 | 94 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow 95 | __pypackages__/ 96 | 97 | # Celery stuff 98 | celerybeat-schedule 99 | celerybeat.pid 100 | 101 | # SageMath parsed files 102 | *.sage.py 103 | 104 | # Environments 105 | .env 106 | .venv 107 | env/ 108 | venv/ 109 | ENV/ 110 | env.bak/ 111 | venv.bak/ 112 | 113 | # Spyder project settings 114 | .spyderproject 115 | .spyproject 116 | 117 | # Rope project settings 118 | .ropeproject 119 | 120 | # mkdocs documentation 121 | /site 122 | 123 | # mypy 124 | .mypy_cache/ 125 | .dmypy.json 126 | dmypy.json 127 | 128 | # Pyre type checker 129 | .pyre/ 130 | -------------------------------------------------------------------------------- /CODEOWNERS: -------------------------------------------------------------------------------- 1 | * EleutherAI/pm-pile -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2020 EleutherAI 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # lm_perplexity 2 | 3 | Code for benchmarking language models with the Pile. 4 | 5 | ## Usage 6 | 7 | Evaluating on GPT-2 (uses GPU): 8 | 9 | ```bash 10 | # Compute intermediate outputs for calculating perplexity (e.g. logprobs) 11 | python lm_perplexity/save_lm_perplexity_data.py \ 12 | --model_config_path preset_configs/gpt2_medium.json \ 13 | --data_path /path/to/mydata.jsonl.zst \ 14 | --output_path /path/to/perplexity_data.p 15 | 16 | # Use intermediate outputs to compute perplexity 17 | python lm_perplexity/compute_perplexity.py \ 18 | --perplexity_data_path /path/to/perplexity_data.p \ 19 | --output_path /path/to/perplexity.json 20 | ``` 21 | 22 | Evaluating on GPT-3 (requires OpenAI API key): 23 | 24 | ```bash 25 | # Compute intermediate outputs for calculating perplexity (e.g. logprobs) 26 | export OPENAI_API_SECRET_KEY=YOUR_KEY_HERE 27 | python lm_perplexity/run_lm_perplexity.py \ 28 | --model_config_path preset_configs/gpt3_curie.json \ 29 | --data_path /path/to/mydata.jsonl.zst \ 30 | --output_path /path/to/perplexity_data.p 31 | 32 | # Use intermediate outputs to compute perplexity 33 | python lm_perplexity/compute_perplexity.py \ 34 | --perplexity_data_path /path/to/perplexity_data.p \ 35 | --output_path /path/to/perplexity.json 36 | ``` 37 | 38 | ## Assets 39 | 40 | JSON files in `assets/${DATASET}/group${GROUP_ID}.json` contain the document indices for the canonical one-tenth split of the test set. Evaluation in the paper were performed on `group0`. 41 | 42 | ## Requirements 43 | 44 | * numpy 45 | * torch 46 | * transformers 47 | * openai 48 | * lm_dataformat 49 | * tqdm -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 22, 3 | 25, 4 | 60, 5 | 61, 6 | 63, 7 | 64, 8 | 76, 9 | 84, 10 | 95, 11 | 99, 12 | 106, 13 | 118, 14 | 123, 15 | 133, 16 | 140, 17 | 141, 18 | 142, 19 | 148, 20 | 157, 21 | 168, 22 | 180, 23 | 193, 24 | 208, 25 | 211, 26 | 221, 27 | 234, 28 | 249, 29 | 300, 30 | 310, 31 | 311, 32 | 321, 33 | 322, 34 | 335, 35 | 393, 36 | 403, 37 | 408, 38 | 422, 39 | 426, 40 | 494, 41 | 504, 42 | 505, 43 | 515, 44 | 520, 45 | 525, 46 | 526, 47 | 538, 48 | 545, 49 | 548, 50 | 552, 51 | 556, 52 | 558, 53 | 565, 54 | 567, 55 | 568, 56 | 580, 57 | 583, 58 | 591, 59 | 597, 60 | 611, 61 | 622, 62 | 655, 63 | 677, 64 | 699, 65 | 708, 66 | 709, 67 | 720, 68 | 725, 69 | 727, 70 | 730, 71 | 756, 72 | 788, 73 | 794, 74 | 805, 75 | 807, 76 | 808, 77 | 810, 78 | 821, 79 | 834, 80 | 857, 81 | 859, 82 | 870, 83 | 892, 84 | 898, 85 | 900, 86 | 901, 87 | 922, 88 | 926, 89 | 932, 90 | 937, 91 | 939, 92 | 970, 93 | 983, 94 | 1002, 95 | 1013, 96 | 1023, 97 | 1025, 98 | 1028, 99 | 1042, 100 | 1063, 101 | 1076, 102 | 1082, 103 | 1084, 104 | 1102, 105 | 1126, 106 | 1127, 107 | 1131, 108 | 1139, 109 | 1146, 110 | 1150, 111 | 1153, 112 | 1155, 113 | 1161, 114 | 1165, 115 | 1167, 116 | 1179, 117 | 1194, 118 | 1206, 119 | 1210, 120 | 1219, 121 | 1220, 122 | 1222, 123 | 1226, 124 | 1242, 125 | 1248, 126 | 1259, 127 | 1268, 128 | 1301, 129 | 1312, 130 | 1315, 131 | 1334, 132 | 1342, 133 | 1344, 134 | 1351, 135 | 1353, 136 | 1369, 137 | 1384, 138 | 1393, 139 | 1397, 140 | 1398, 141 | 1399, 142 | 1469, 143 | 1471, 144 | 1481, 145 | 1484, 146 | 1512, 147 | 1537, 148 | 1547, 149 | 1557, 150 | 1570, 151 | 1572, 152 | 1596, 153 | 1603, 154 | 1606, 155 | 1607, 156 | 1613, 157 | 1614, 158 | 1624, 159 | 1628, 160 | 1633, 161 | 1640, 162 | 1645, 163 | 1656, 164 | 1705, 165 | 1708, 166 | 1710, 167 | 1718, 168 | 1734, 169 | 1741, 170 | 1748, 171 | 1773, 172 | 1780, 173 | 1790, 174 | 1802, 175 | 1812, 176 | 1815, 177 | 1840, 178 | 1858, 179 | 1869, 180 | 1872, 181 | 1874, 182 | 1886, 183 | 1898, 184 | 1932, 185 | 1943, 186 | 1946, 187 | 1947, 188 | 1966, 189 | 1971, 190 | 1973, 191 | 1999, 192 | 2008, 193 | 2013, 194 | 2014, 195 | 2020, 196 | 2027, 197 | 2030, 198 | 2038, 199 | 2042, 200 | 2051, 201 | 2056, 202 | 2070, 203 | 2081, 204 | 2092, 205 | 2109, 206 | 2110, 207 | 2117, 208 | 2126, 209 | 2144, 210 | 2157, 211 | 2162, 212 | 2164, 213 | 2177, 214 | 2203, 215 | 2215, 216 | 2217, 217 | 2227, 218 | 2259, 219 | 2260, 220 | 2267, 221 | 2272, 222 | 2279, 223 | 2291, 224 | 2295, 225 | 2302, 226 | 2321, 227 | 2323, 228 | 2325, 229 | 2359, 230 | 2366, 231 | 2367, 232 | 2369, 233 | 2370, 234 | 2378, 235 | 2380, 236 | 2382, 237 | 2387, 238 | 2404, 239 | 2405 240 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 10, 4 | 11, 5 | 42, 6 | 46, 7 | 48, 8 | 56, 9 | 67, 10 | 91, 11 | 104, 12 | 122, 13 | 129, 14 | 147, 15 | 154, 16 | 163, 17 | 167, 18 | 171, 19 | 176, 20 | 181, 21 | 183, 22 | 216, 23 | 227, 24 | 229, 25 | 231, 26 | 238, 27 | 243, 28 | 256, 29 | 268, 30 | 277, 31 | 291, 32 | 308, 33 | 320, 34 | 324, 35 | 336, 36 | 339, 37 | 350, 38 | 353, 39 | 366, 40 | 369, 41 | 372, 42 | 390, 43 | 395, 44 | 398, 45 | 404, 46 | 423, 47 | 430, 48 | 437, 49 | 454, 50 | 460, 51 | 462, 52 | 465, 53 | 466, 54 | 508, 55 | 513, 56 | 533, 57 | 560, 58 | 572, 59 | 587, 60 | 595, 61 | 609, 62 | 613, 63 | 617, 64 | 623, 65 | 637, 66 | 644, 67 | 647, 68 | 657, 69 | 659, 70 | 666, 71 | 672, 72 | 673, 73 | 680, 74 | 706, 75 | 714, 76 | 721, 77 | 726, 78 | 731, 79 | 747, 80 | 769, 81 | 776, 82 | 781, 83 | 785, 84 | 836, 85 | 845, 86 | 847, 87 | 855, 88 | 868, 89 | 879, 90 | 882, 91 | 889, 92 | 918, 93 | 919, 94 | 927, 95 | 954, 96 | 965, 97 | 1004, 98 | 1011, 99 | 1017, 100 | 1020, 101 | 1021, 102 | 1026, 103 | 1032, 104 | 1041, 105 | 1049, 106 | 1070, 107 | 1075, 108 | 1078, 109 | 1079, 110 | 1085, 111 | 1087, 112 | 1100, 113 | 1103, 114 | 1107, 115 | 1117, 116 | 1118, 117 | 1140, 118 | 1145, 119 | 1147, 120 | 1149, 121 | 1152, 122 | 1156, 123 | 1166, 124 | 1177, 125 | 1209, 126 | 1211, 127 | 1218, 128 | 1225, 129 | 1231, 130 | 1233, 131 | 1243, 132 | 1251, 133 | 1261, 134 | 1262, 135 | 1272, 136 | 1289, 137 | 1295, 138 | 1296, 139 | 1299, 140 | 1304, 141 | 1325, 142 | 1329, 143 | 1346, 144 | 1347, 145 | 1350, 146 | 1359, 147 | 1374, 148 | 1404, 149 | 1405, 150 | 1412, 151 | 1433, 152 | 1435, 153 | 1451, 154 | 1452, 155 | 1455, 156 | 1464, 157 | 1479, 158 | 1493, 159 | 1509, 160 | 1522, 161 | 1523, 162 | 1541, 163 | 1550, 164 | 1553, 165 | 1564, 166 | 1573, 167 | 1578, 168 | 1586, 169 | 1587, 170 | 1594, 171 | 1597, 172 | 1598, 173 | 1599, 174 | 1609, 175 | 1611, 176 | 1615, 177 | 1623, 178 | 1630, 179 | 1646, 180 | 1649, 181 | 1650, 182 | 1652, 183 | 1654, 184 | 1657, 185 | 1658, 186 | 1669, 187 | 1675, 188 | 1684, 189 | 1692, 190 | 1696, 191 | 1707, 192 | 1727, 193 | 1731, 194 | 1782, 195 | 1800, 196 | 1820, 197 | 1831, 198 | 1847, 199 | 1863, 200 | 1871, 201 | 1880, 202 | 1903, 203 | 1917, 204 | 1920, 205 | 1939, 206 | 1958, 207 | 1970, 208 | 1985, 209 | 1992, 210 | 1995, 211 | 2004, 212 | 2007, 213 | 2023, 214 | 2026, 215 | 2035, 216 | 2048, 217 | 2067, 218 | 2083, 219 | 2091, 220 | 2098, 221 | 2102, 222 | 2107, 223 | 2108, 224 | 2118, 225 | 2127, 226 | 2140, 227 | 2142, 228 | 2143, 229 | 2148, 230 | 2166, 231 | 2169, 232 | 2171, 233 | 2178, 234 | 2190, 235 | 2199, 236 | 2206, 237 | 2213, 238 | 2221, 239 | 2222, 240 | 2223, 241 | 2225, 242 | 2253, 243 | 2266, 244 | 2280, 245 | 2281, 246 | 2292, 247 | 2294, 248 | 2299, 249 | 2305, 250 | 2312, 251 | 2328, 252 | 2335, 253 | 2356, 254 | 2396 255 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 18, 3 | 47, 4 | 50, 5 | 52, 6 | 53, 7 | 58, 8 | 65, 9 | 73, 10 | 75, 11 | 79, 12 | 97, 13 | 111, 14 | 113, 15 | 114, 16 | 164, 17 | 166, 18 | 194, 19 | 200, 20 | 205, 21 | 212, 22 | 213, 23 | 219, 24 | 233, 25 | 235, 26 | 236, 27 | 242, 28 | 245, 29 | 255, 30 | 281, 31 | 283, 32 | 285, 33 | 295, 34 | 318, 35 | 326, 36 | 332, 37 | 334, 38 | 345, 39 | 352, 40 | 354, 41 | 358, 42 | 360, 43 | 365, 44 | 375, 45 | 388, 46 | 400, 47 | 410, 48 | 440, 49 | 447, 50 | 449, 51 | 451, 52 | 452, 53 | 459, 54 | 463, 55 | 468, 56 | 474, 57 | 479, 58 | 480, 59 | 489, 60 | 493, 61 | 503, 62 | 509, 63 | 524, 64 | 536, 65 | 537, 66 | 544, 67 | 566, 68 | 570, 69 | 579, 70 | 608, 71 | 618, 72 | 630, 73 | 697, 74 | 719, 75 | 737, 76 | 746, 77 | 753, 78 | 754, 79 | 755, 80 | 783, 81 | 816, 82 | 820, 83 | 822, 84 | 832, 85 | 878, 86 | 885, 87 | 895, 88 | 908, 89 | 914, 90 | 925, 91 | 945, 92 | 951, 93 | 955, 94 | 957, 95 | 961, 96 | 962, 97 | 964, 98 | 975, 99 | 980, 100 | 988, 101 | 1005, 102 | 1027, 103 | 1052, 104 | 1057, 105 | 1059, 106 | 1061, 107 | 1089, 108 | 1120, 109 | 1123, 110 | 1144, 111 | 1170, 112 | 1178, 113 | 1181, 114 | 1189, 115 | 1203, 116 | 1215, 117 | 1234, 118 | 1280, 119 | 1282, 120 | 1291, 121 | 1298, 122 | 1300, 123 | 1308, 124 | 1317, 125 | 1318, 126 | 1339, 127 | 1345, 128 | 1377, 129 | 1383, 130 | 1408, 131 | 1426, 132 | 1427, 133 | 1430, 134 | 1436, 135 | 1440, 136 | 1441, 137 | 1444, 138 | 1446, 139 | 1448, 140 | 1457, 141 | 1465, 142 | 1466, 143 | 1470, 144 | 1476, 145 | 1497, 146 | 1502, 147 | 1511, 148 | 1513, 149 | 1520, 150 | 1531, 151 | 1532, 152 | 1539, 153 | 1561, 154 | 1569, 155 | 1579, 156 | 1589, 157 | 1592, 158 | 1618, 159 | 1648, 160 | 1673, 161 | 1678, 162 | 1679, 163 | 1693, 164 | 1706, 165 | 1720, 166 | 1739, 167 | 1766, 168 | 1772, 169 | 1775, 170 | 1778, 171 | 1789, 172 | 1809, 173 | 1819, 174 | 1835, 175 | 1848, 176 | 1870, 177 | 1876, 178 | 1884, 179 | 1887, 180 | 1888, 181 | 1891, 182 | 1892, 183 | 1895, 184 | 1910, 185 | 1912, 186 | 1913, 187 | 1937, 188 | 1964, 189 | 1967, 190 | 1987, 191 | 2002, 192 | 2012, 193 | 2021, 194 | 2029, 195 | 2050, 196 | 2053, 197 | 2079, 198 | 2089, 199 | 2101, 200 | 2103, 201 | 2116, 202 | 2130, 203 | 2131, 204 | 2133, 205 | 2145, 206 | 2156, 207 | 2161, 208 | 2170, 209 | 2184, 210 | 2185, 211 | 2189, 212 | 2197, 213 | 2205, 214 | 2214, 215 | 2243, 216 | 2269, 217 | 2270, 218 | 2301, 219 | 2319, 220 | 2322, 221 | 2326, 222 | 2330, 223 | 2343, 224 | 2345, 225 | 2353, 226 | 2354, 227 | 2377, 228 | 2384, 229 | 2386, 230 | 2389, 231 | 2395, 232 | 2397 233 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 21, 4 | 26, 5 | 28, 6 | 29, 7 | 38, 8 | 39, 9 | 54, 10 | 62, 11 | 78, 12 | 81, 13 | 82, 14 | 90, 15 | 92, 16 | 102, 17 | 105, 18 | 108, 19 | 121, 20 | 126, 21 | 127, 22 | 151, 23 | 155, 24 | 165, 25 | 169, 26 | 179, 27 | 190, 28 | 226, 29 | 240, 30 | 241, 31 | 246, 32 | 251, 33 | 252, 34 | 260, 35 | 265, 36 | 266, 37 | 278, 38 | 287, 39 | 288, 40 | 297, 41 | 309, 42 | 313, 43 | 330, 44 | 356, 45 | 371, 46 | 406, 47 | 419, 48 | 425, 49 | 429, 50 | 434, 51 | 456, 52 | 476, 53 | 486, 54 | 499, 55 | 512, 56 | 522, 57 | 535, 58 | 551, 59 | 561, 60 | 573, 61 | 574, 62 | 586, 63 | 594, 64 | 599, 65 | 602, 66 | 612, 67 | 628, 68 | 631, 69 | 634, 70 | 636, 71 | 645, 72 | 646, 73 | 650, 74 | 654, 75 | 660, 76 | 665, 77 | 668, 78 | 676, 79 | 678, 80 | 682, 81 | 684, 82 | 723, 83 | 729, 84 | 732, 85 | 733, 86 | 743, 87 | 765, 88 | 767, 89 | 771, 90 | 774, 91 | 780, 92 | 784, 93 | 793, 94 | 799, 95 | 801, 96 | 804, 97 | 806, 98 | 811, 99 | 818, 100 | 827, 101 | 833, 102 | 838, 103 | 852, 104 | 854, 105 | 869, 106 | 881, 107 | 888, 108 | 903, 109 | 904, 110 | 909, 111 | 910, 112 | 912, 113 | 913, 114 | 915, 115 | 924, 116 | 928, 117 | 929, 118 | 936, 119 | 943, 120 | 944, 121 | 946, 122 | 952, 123 | 959, 124 | 967, 125 | 971, 126 | 982, 127 | 984, 128 | 989, 129 | 995, 130 | 1000, 131 | 1030, 132 | 1035, 133 | 1044, 134 | 1050, 135 | 1064, 136 | 1072, 137 | 1074, 138 | 1098, 139 | 1109, 140 | 1110, 141 | 1116, 142 | 1136, 143 | 1158, 144 | 1172, 145 | 1199, 146 | 1200, 147 | 1232, 148 | 1236, 149 | 1239, 150 | 1240, 151 | 1265, 152 | 1286, 153 | 1323, 154 | 1341, 155 | 1362, 156 | 1371, 157 | 1400, 158 | 1406, 159 | 1416, 160 | 1418, 161 | 1443, 162 | 1460, 163 | 1485, 164 | 1491, 165 | 1504, 166 | 1508, 167 | 1516, 168 | 1517, 169 | 1521, 170 | 1544, 171 | 1546, 172 | 1576, 173 | 1590, 174 | 1595, 175 | 1600, 176 | 1601, 177 | 1617, 178 | 1637, 179 | 1638, 180 | 1639, 181 | 1651, 182 | 1661, 183 | 1668, 184 | 1671, 185 | 1681, 186 | 1687, 187 | 1699, 188 | 1711, 189 | 1726, 190 | 1730, 191 | 1736, 192 | 1743, 193 | 1770, 194 | 1774, 195 | 1781, 196 | 1784, 197 | 1794, 198 | 1796, 199 | 1813, 200 | 1844, 201 | 1846, 202 | 1853, 203 | 1881, 204 | 1889, 205 | 1897, 206 | 1904, 207 | 1906, 208 | 1916, 209 | 1925, 210 | 1938, 211 | 1940, 212 | 1942, 213 | 1944, 214 | 1945, 215 | 1978, 216 | 2018, 217 | 2062, 218 | 2071, 219 | 2084, 220 | 2088, 221 | 2096, 222 | 2100, 223 | 2104, 224 | 2105, 225 | 2115, 226 | 2128, 227 | 2137, 228 | 2139, 229 | 2163, 230 | 2165, 231 | 2183, 232 | 2204, 233 | 2207, 234 | 2209, 235 | 2226, 236 | 2230, 237 | 2231, 238 | 2241, 239 | 2252, 240 | 2289, 241 | 2290, 242 | 2297, 243 | 2311, 244 | 2318, 245 | 2324, 246 | 2344, 247 | 2360, 248 | 2361, 249 | 2372, 250 | 2374, 251 | 2393, 252 | 2402 253 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 36, 4 | 37, 5 | 43, 6 | 44, 7 | 51, 8 | 77, 9 | 85, 10 | 88, 11 | 94, 12 | 100, 13 | 103, 14 | 125, 15 | 143, 16 | 149, 17 | 159, 18 | 182, 19 | 192, 20 | 195, 21 | 197, 22 | 198, 23 | 204, 24 | 214, 25 | 228, 26 | 239, 27 | 253, 28 | 263, 29 | 267, 30 | 280, 31 | 284, 32 | 294, 33 | 298, 34 | 299, 35 | 302, 36 | 306, 37 | 344, 38 | 355, 39 | 357, 40 | 359, 41 | 364, 42 | 368, 43 | 373, 44 | 377, 45 | 382, 46 | 387, 47 | 396, 48 | 401, 49 | 420, 50 | 431, 51 | 457, 52 | 458, 53 | 471, 54 | 478, 55 | 481, 56 | 483, 57 | 487, 58 | 488, 59 | 490, 60 | 518, 61 | 521, 62 | 523, 63 | 528, 64 | 542, 65 | 543, 66 | 549, 67 | 564, 68 | 592, 69 | 614, 70 | 627, 71 | 632, 72 | 641, 73 | 649, 74 | 662, 75 | 702, 76 | 703, 77 | 704, 78 | 717, 79 | 718, 80 | 760, 81 | 762, 82 | 764, 83 | 770, 84 | 772, 85 | 779, 86 | 790, 87 | 792, 88 | 796, 89 | 817, 90 | 842, 91 | 843, 92 | 844, 93 | 856, 94 | 860, 95 | 861, 96 | 865, 97 | 867, 98 | 887, 99 | 896, 100 | 899, 101 | 905, 102 | 907, 103 | 911, 104 | 931, 105 | 949, 106 | 960, 107 | 977, 108 | 993, 109 | 999, 110 | 1038, 111 | 1048, 112 | 1058, 113 | 1065, 114 | 1066, 115 | 1080, 116 | 1101, 117 | 1104, 118 | 1106, 119 | 1121, 120 | 1122, 121 | 1132, 122 | 1143, 123 | 1164, 124 | 1168, 125 | 1174, 126 | 1175, 127 | 1192, 128 | 1201, 129 | 1212, 130 | 1214, 131 | 1216, 132 | 1223, 133 | 1244, 134 | 1246, 135 | 1249, 136 | 1256, 137 | 1270, 138 | 1274, 139 | 1275, 140 | 1288, 141 | 1302, 142 | 1307, 143 | 1319, 144 | 1324, 145 | 1338, 146 | 1368, 147 | 1370, 148 | 1386, 149 | 1388, 150 | 1389, 151 | 1395, 152 | 1401, 153 | 1407, 154 | 1409, 155 | 1413, 156 | 1417, 157 | 1420, 158 | 1428, 159 | 1445, 160 | 1449, 161 | 1454, 162 | 1461, 163 | 1475, 164 | 1500, 165 | 1536, 166 | 1543, 167 | 1562, 168 | 1571, 169 | 1605, 170 | 1610, 171 | 1626, 172 | 1634, 173 | 1641, 174 | 1653, 175 | 1659, 176 | 1660, 177 | 1666, 178 | 1685, 179 | 1701, 180 | 1719, 181 | 1721, 182 | 1740, 183 | 1761, 184 | 1804, 185 | 1810, 186 | 1814, 187 | 1818, 188 | 1826, 189 | 1830, 190 | 1838, 191 | 1856, 192 | 1861, 193 | 1864, 194 | 1883, 195 | 1899, 196 | 1931, 197 | 1935, 198 | 1950, 199 | 1951, 200 | 1957, 201 | 1988, 202 | 1989, 203 | 1993, 204 | 2000, 205 | 2016, 206 | 2019, 207 | 2044, 208 | 2049, 209 | 2061, 210 | 2066, 211 | 2073, 212 | 2075, 213 | 2078, 214 | 2086, 215 | 2093, 216 | 2099, 217 | 2111, 218 | 2119, 219 | 2150, 220 | 2173, 221 | 2176, 222 | 2193, 223 | 2198, 224 | 2201, 225 | 2212, 226 | 2228, 227 | 2232, 228 | 2234, 229 | 2239, 230 | 2246, 231 | 2250, 232 | 2256, 233 | 2261, 234 | 2274, 235 | 2276, 236 | 2298, 237 | 2303, 238 | 2307, 239 | 2342, 240 | 2348, 241 | 2352, 242 | 2357, 243 | 2375, 244 | 2381, 245 | 2385, 246 | 2391, 247 | 2400 248 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 20, 4 | 34, 5 | 40, 6 | 41, 7 | 57, 8 | 59, 9 | 66, 10 | 80, 11 | 96, 12 | 101, 13 | 107, 14 | 136, 15 | 146, 16 | 196, 17 | 207, 18 | 217, 19 | 222, 20 | 224, 21 | 296, 22 | 301, 23 | 307, 24 | 315, 25 | 319, 26 | 327, 27 | 341, 28 | 347, 29 | 376, 30 | 391, 31 | 392, 32 | 402, 33 | 413, 34 | 424, 35 | 433, 36 | 441, 37 | 442, 38 | 453, 39 | 461, 40 | 484, 41 | 491, 42 | 495, 43 | 539, 44 | 540, 45 | 576, 46 | 578, 47 | 598, 48 | 604, 49 | 625, 50 | 638, 51 | 639, 52 | 640, 53 | 643, 54 | 648, 55 | 661, 56 | 674, 57 | 675, 58 | 683, 59 | 686, 60 | 691, 61 | 705, 62 | 707, 63 | 713, 64 | 734, 65 | 735, 66 | 738, 67 | 739, 68 | 744, 69 | 758, 70 | 766, 71 | 786, 72 | 791, 73 | 798, 74 | 812, 75 | 835, 76 | 839, 77 | 858, 78 | 866, 79 | 874, 80 | 880, 81 | 883, 82 | 884, 83 | 893, 84 | 917, 85 | 934, 86 | 940, 87 | 941, 88 | 950, 89 | 968, 90 | 978, 91 | 981, 92 | 1015, 93 | 1016, 94 | 1046, 95 | 1051, 96 | 1056, 97 | 1077, 98 | 1086, 99 | 1093, 100 | 1099, 101 | 1108, 102 | 1119, 103 | 1125, 104 | 1130, 105 | 1134, 106 | 1142, 107 | 1148, 108 | 1151, 109 | 1160, 110 | 1191, 111 | 1193, 112 | 1197, 113 | 1208, 114 | 1252, 115 | 1266, 116 | 1267, 117 | 1273, 118 | 1277, 119 | 1278, 120 | 1279, 121 | 1294, 122 | 1303, 123 | 1320, 124 | 1335, 125 | 1343, 126 | 1349, 127 | 1355, 128 | 1358, 129 | 1360, 130 | 1378, 131 | 1379, 132 | 1394, 133 | 1431, 134 | 1434, 135 | 1458, 136 | 1478, 137 | 1495, 138 | 1514, 139 | 1515, 140 | 1526, 141 | 1535, 142 | 1549, 143 | 1554, 144 | 1563, 145 | 1582, 146 | 1583, 147 | 1593, 148 | 1604, 149 | 1608, 150 | 1629, 151 | 1635, 152 | 1643, 153 | 1644, 154 | 1665, 155 | 1670, 156 | 1672, 157 | 1683, 158 | 1691, 159 | 1700, 160 | 1704, 161 | 1717, 162 | 1725, 163 | 1728, 164 | 1737, 165 | 1738, 166 | 1750, 167 | 1753, 168 | 1762, 169 | 1765, 170 | 1768, 171 | 1769, 172 | 1779, 173 | 1785, 174 | 1807, 175 | 1866, 176 | 1868, 177 | 1875, 178 | 1879, 179 | 1882, 180 | 1885, 181 | 1909, 182 | 1915, 183 | 1922, 184 | 1926, 185 | 1933, 186 | 1954, 187 | 1976, 188 | 1979, 189 | 1996, 190 | 2001, 191 | 2003, 192 | 2022, 193 | 2033, 194 | 2040, 195 | 2047, 196 | 2052, 197 | 2058, 198 | 2059, 199 | 2072, 200 | 2085, 201 | 2097, 202 | 2155, 203 | 2172, 204 | 2180, 205 | 2194, 206 | 2196, 207 | 2208, 208 | 2218, 209 | 2224, 210 | 2293, 211 | 2300, 212 | 2304, 213 | 2306, 214 | 2309, 215 | 2315, 216 | 2316, 217 | 2317, 218 | 2336, 219 | 2340, 220 | 2358, 221 | 2365, 222 | 2368, 223 | 2376, 224 | 2399 225 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 4, 4 | 12, 5 | 23, 6 | 33, 7 | 35, 8 | 45, 9 | 49, 10 | 55, 11 | 86, 12 | 87, 13 | 98, 14 | 112, 15 | 119, 16 | 131, 17 | 132, 18 | 138, 19 | 152, 20 | 158, 21 | 160, 22 | 173, 23 | 178, 24 | 188, 25 | 191, 26 | 201, 27 | 232, 28 | 237, 29 | 257, 30 | 259, 31 | 261, 32 | 262, 33 | 273, 34 | 274, 35 | 279, 36 | 312, 37 | 314, 38 | 316, 39 | 333, 40 | 351, 41 | 367, 42 | 374, 43 | 379, 44 | 383, 45 | 385, 46 | 386, 47 | 399, 48 | 409, 49 | 412, 50 | 414, 51 | 418, 52 | 448, 53 | 473, 54 | 492, 55 | 497, 56 | 510, 57 | 511, 58 | 530, 59 | 562, 60 | 569, 61 | 581, 62 | 582, 63 | 596, 64 | 603, 65 | 607, 66 | 615, 67 | 626, 68 | 633, 69 | 652, 70 | 658, 71 | 688, 72 | 710, 73 | 712, 74 | 716, 75 | 736, 76 | 742, 77 | 745, 78 | 751, 79 | 752, 80 | 761, 81 | 775, 82 | 778, 83 | 782, 84 | 800, 85 | 809, 86 | 813, 87 | 819, 88 | 825, 89 | 829, 90 | 830, 91 | 840, 92 | 841, 93 | 850, 94 | 851, 95 | 853, 96 | 921, 97 | 947, 98 | 973, 99 | 979, 100 | 987, 101 | 996, 102 | 1006, 103 | 1012, 104 | 1014, 105 | 1024, 106 | 1034, 107 | 1036, 108 | 1039, 109 | 1053, 110 | 1054, 111 | 1062, 112 | 1069, 113 | 1073, 114 | 1091, 115 | 1095, 116 | 1096, 117 | 1105, 118 | 1113, 119 | 1115, 120 | 1124, 121 | 1135, 122 | 1176, 123 | 1180, 124 | 1182, 125 | 1187, 126 | 1217, 127 | 1221, 128 | 1228, 129 | 1230, 130 | 1238, 131 | 1263, 132 | 1276, 133 | 1283, 134 | 1284, 135 | 1285, 136 | 1310, 137 | 1321, 138 | 1330, 139 | 1348, 140 | 1352, 141 | 1366, 142 | 1367, 143 | 1382, 144 | 1387, 145 | 1402, 146 | 1411, 147 | 1414, 148 | 1415, 149 | 1421, 150 | 1422, 151 | 1423, 152 | 1432, 153 | 1437, 154 | 1438, 155 | 1442, 156 | 1459, 157 | 1473, 158 | 1480, 159 | 1490, 160 | 1498, 161 | 1501, 162 | 1506, 163 | 1518, 164 | 1533, 165 | 1534, 166 | 1542, 167 | 1545, 168 | 1552, 169 | 1556, 170 | 1560, 171 | 1580, 172 | 1581, 173 | 1631, 174 | 1636, 175 | 1642, 176 | 1647, 177 | 1677, 178 | 1680, 179 | 1682, 180 | 1689, 181 | 1698, 182 | 1709, 183 | 1712, 184 | 1713, 185 | 1716, 186 | 1756, 187 | 1763, 188 | 1783, 189 | 1795, 190 | 1797, 191 | 1798, 192 | 1803, 193 | 1811, 194 | 1816, 195 | 1823, 196 | 1824, 197 | 1834, 198 | 1837, 199 | 1841, 200 | 1845, 201 | 1854, 202 | 1857, 203 | 1865, 204 | 1873, 205 | 1878, 206 | 1896, 207 | 1914, 208 | 1952, 209 | 1974, 210 | 1975, 211 | 1982, 212 | 1984, 213 | 2015, 214 | 2017, 215 | 2025, 216 | 2031, 217 | 2032, 218 | 2034, 219 | 2036, 220 | 2039, 221 | 2043, 222 | 2046, 223 | 2054, 224 | 2060, 225 | 2063, 226 | 2064, 227 | 2065, 228 | 2112, 229 | 2121, 230 | 2122, 231 | 2125, 232 | 2136, 233 | 2141, 234 | 2149, 235 | 2154, 236 | 2168, 237 | 2181, 238 | 2186, 239 | 2200, 240 | 2216, 241 | 2219, 242 | 2220, 243 | 2229, 244 | 2248, 245 | 2249, 246 | 2254, 247 | 2263, 248 | 2264, 249 | 2265, 250 | 2284, 251 | 2288, 252 | 2296, 253 | 2310, 254 | 2313, 255 | 2327, 256 | 2337, 257 | 2338, 258 | 2339, 259 | 2350, 260 | 2364, 261 | 2371, 262 | 2383, 263 | 2388, 264 | 2390, 265 | 2403 266 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 7, 4 | 8, 5 | 13, 6 | 16, 7 | 19, 8 | 71, 9 | 72, 10 | 74, 11 | 110, 12 | 115, 13 | 120, 14 | 124, 15 | 135, 16 | 139, 17 | 153, 18 | 161, 19 | 172, 20 | 177, 21 | 186, 22 | 187, 23 | 199, 24 | 203, 25 | 209, 26 | 220, 27 | 225, 28 | 258, 29 | 272, 30 | 282, 31 | 290, 32 | 304, 33 | 317, 34 | 325, 35 | 337, 36 | 338, 37 | 342, 38 | 346, 39 | 348, 40 | 361, 41 | 363, 42 | 370, 43 | 394, 44 | 407, 45 | 416, 46 | 417, 47 | 421, 48 | 427, 49 | 432, 50 | 439, 51 | 450, 52 | 455, 53 | 467, 54 | 482, 55 | 502, 56 | 514, 57 | 516, 58 | 517, 59 | 527, 60 | 531, 61 | 532, 62 | 546, 63 | 550, 64 | 553, 65 | 557, 66 | 559, 67 | 571, 68 | 585, 69 | 600, 70 | 601, 71 | 610, 72 | 619, 73 | 620, 74 | 624, 75 | 656, 76 | 667, 77 | 687, 78 | 689, 79 | 690, 80 | 692, 81 | 694, 82 | 695, 83 | 700, 84 | 711, 85 | 724, 86 | 749, 87 | 757, 88 | 777, 89 | 795, 90 | 802, 91 | 803, 92 | 815, 93 | 823, 94 | 826, 95 | 828, 96 | 849, 97 | 863, 98 | 871, 99 | 872, 100 | 873, 101 | 877, 102 | 891, 103 | 897, 104 | 916, 105 | 920, 106 | 923, 107 | 930, 108 | 933, 109 | 935, 110 | 953, 111 | 976, 112 | 997, 113 | 998, 114 | 1001, 115 | 1003, 116 | 1018, 117 | 1022, 118 | 1029, 119 | 1033, 120 | 1047, 121 | 1055, 122 | 1060, 123 | 1128, 124 | 1204, 125 | 1213, 126 | 1235, 127 | 1250, 128 | 1254, 129 | 1257, 130 | 1260, 131 | 1264, 132 | 1287, 133 | 1305, 134 | 1309, 135 | 1314, 136 | 1328, 137 | 1331, 138 | 1333, 139 | 1337, 140 | 1340, 141 | 1354, 142 | 1357, 143 | 1375, 144 | 1381, 145 | 1385, 146 | 1390, 147 | 1419, 148 | 1424, 149 | 1425, 150 | 1450, 151 | 1453, 152 | 1462, 153 | 1477, 154 | 1488, 155 | 1492, 156 | 1494, 157 | 1505, 158 | 1525, 159 | 1551, 160 | 1558, 161 | 1619, 162 | 1655, 163 | 1662, 164 | 1663, 165 | 1674, 166 | 1694, 167 | 1695, 168 | 1703, 169 | 1714, 170 | 1732, 171 | 1735, 172 | 1742, 173 | 1744, 174 | 1746, 175 | 1752, 176 | 1805, 177 | 1821, 178 | 1828, 179 | 1836, 180 | 1843, 181 | 1849, 182 | 1860, 183 | 1867, 184 | 1890, 185 | 1893, 186 | 1894, 187 | 1908, 188 | 1923, 189 | 1924, 190 | 1927, 191 | 1928, 192 | 1936, 193 | 1941, 194 | 1955, 195 | 1960, 196 | 1963, 197 | 1977, 198 | 1981, 199 | 1983, 200 | 1990, 201 | 1991, 202 | 2005, 203 | 2006, 204 | 2009, 205 | 2028, 206 | 2037, 207 | 2041, 208 | 2068, 209 | 2077, 210 | 2082, 211 | 2090, 212 | 2106, 213 | 2113, 214 | 2129, 215 | 2134, 216 | 2151, 217 | 2152, 218 | 2153, 219 | 2167, 220 | 2182, 221 | 2187, 222 | 2192, 223 | 2202, 224 | 2211, 225 | 2233, 226 | 2240, 227 | 2247, 228 | 2251, 229 | 2257, 230 | 2258, 231 | 2268, 232 | 2273, 233 | 2275, 234 | 2277, 235 | 2285, 236 | 2308, 237 | 2320, 238 | 2329, 239 | 2347, 240 | 2351, 241 | 2363, 242 | 2379, 243 | 2401 244 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 14, 4 | 31, 5 | 83, 6 | 93, 7 | 116, 8 | 117, 9 | 144, 10 | 145, 11 | 150, 12 | 162, 13 | 170, 14 | 174, 15 | 184, 16 | 185, 17 | 189, 18 | 202, 19 | 210, 20 | 215, 21 | 247, 22 | 248, 23 | 264, 24 | 270, 25 | 275, 26 | 276, 27 | 289, 28 | 292, 29 | 293, 30 | 305, 31 | 329, 32 | 340, 33 | 362, 34 | 378, 35 | 389, 36 | 397, 37 | 415, 38 | 428, 39 | 435, 40 | 436, 41 | 443, 42 | 444, 43 | 446, 44 | 464, 45 | 470, 46 | 472, 47 | 475, 48 | 477, 49 | 496, 50 | 501, 51 | 506, 52 | 519, 53 | 541, 54 | 554, 55 | 577, 56 | 588, 57 | 589, 58 | 605, 59 | 606, 60 | 616, 61 | 629, 62 | 635, 63 | 642, 64 | 651, 65 | 653, 66 | 669, 67 | 671, 68 | 681, 69 | 701, 70 | 715, 71 | 722, 72 | 728, 73 | 740, 74 | 741, 75 | 748, 76 | 759, 77 | 763, 78 | 768, 79 | 773, 80 | 787, 81 | 797, 82 | 824, 83 | 846, 84 | 875, 85 | 876, 86 | 902, 87 | 958, 88 | 963, 89 | 966, 90 | 969, 91 | 972, 92 | 974, 93 | 986, 94 | 990, 95 | 991, 96 | 994, 97 | 1008, 98 | 1037, 99 | 1045, 100 | 1071, 101 | 1083, 102 | 1088, 103 | 1092, 104 | 1097, 105 | 1111, 106 | 1129, 107 | 1133, 108 | 1138, 109 | 1157, 110 | 1159, 111 | 1162, 112 | 1171, 113 | 1185, 114 | 1190, 115 | 1195, 116 | 1196, 117 | 1198, 118 | 1207, 119 | 1224, 120 | 1229, 121 | 1237, 122 | 1245, 123 | 1253, 124 | 1255, 125 | 1258, 126 | 1281, 127 | 1293, 128 | 1306, 129 | 1313, 130 | 1316, 131 | 1322, 132 | 1327, 133 | 1332, 134 | 1336, 135 | 1356, 136 | 1365, 137 | 1372, 138 | 1373, 139 | 1380, 140 | 1391, 141 | 1392, 142 | 1396, 143 | 1403, 144 | 1410, 145 | 1429, 146 | 1447, 147 | 1463, 148 | 1467, 149 | 1468, 150 | 1474, 151 | 1483, 152 | 1486, 153 | 1487, 154 | 1496, 155 | 1499, 156 | 1510, 157 | 1524, 158 | 1529, 159 | 1530, 160 | 1538, 161 | 1540, 162 | 1548, 163 | 1555, 164 | 1559, 165 | 1565, 166 | 1566, 167 | 1568, 168 | 1575, 169 | 1602, 170 | 1621, 171 | 1686, 172 | 1688, 173 | 1697, 174 | 1702, 175 | 1722, 176 | 1724, 177 | 1733, 178 | 1745, 179 | 1749, 180 | 1755, 181 | 1759, 182 | 1764, 183 | 1776, 184 | 1786, 185 | 1788, 186 | 1791, 187 | 1792, 188 | 1793, 189 | 1801, 190 | 1806, 191 | 1825, 192 | 1827, 193 | 1829, 194 | 1842, 195 | 1852, 196 | 1859, 197 | 1862, 198 | 1877, 199 | 1900, 200 | 1901, 201 | 1911, 202 | 1918, 203 | 1929, 204 | 1930, 205 | 1934, 206 | 1953, 207 | 1961, 208 | 1968, 209 | 1969, 210 | 1972, 211 | 1997, 212 | 1998, 213 | 2045, 214 | 2076, 215 | 2087, 216 | 2094, 217 | 2114, 218 | 2120, 219 | 2123, 220 | 2124, 221 | 2138, 222 | 2147, 223 | 2158, 224 | 2160, 225 | 2174, 226 | 2179, 227 | 2188, 228 | 2191, 229 | 2195, 230 | 2210, 231 | 2236, 232 | 2237, 233 | 2242, 234 | 2244, 235 | 2255, 236 | 2262, 237 | 2271, 238 | 2278, 239 | 2286, 240 | 2287, 241 | 2314, 242 | 2332, 243 | 2333, 244 | 2341, 245 | 2362, 246 | 2373, 247 | 2392 248 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/arxiv/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 15, 3 | 17, 4 | 24, 5 | 27, 6 | 30, 7 | 32, 8 | 68, 9 | 69, 10 | 70, 11 | 89, 12 | 109, 13 | 128, 14 | 130, 15 | 134, 16 | 137, 17 | 156, 18 | 175, 19 | 206, 20 | 218, 21 | 223, 22 | 230, 23 | 244, 24 | 250, 25 | 254, 26 | 269, 27 | 271, 28 | 286, 29 | 303, 30 | 323, 31 | 328, 32 | 331, 33 | 343, 34 | 349, 35 | 380, 36 | 381, 37 | 384, 38 | 405, 39 | 411, 40 | 438, 41 | 445, 42 | 469, 43 | 485, 44 | 498, 45 | 500, 46 | 507, 47 | 529, 48 | 534, 49 | 547, 50 | 555, 51 | 563, 52 | 575, 53 | 584, 54 | 590, 55 | 593, 56 | 621, 57 | 663, 58 | 664, 59 | 670, 60 | 679, 61 | 685, 62 | 693, 63 | 696, 64 | 698, 65 | 750, 66 | 789, 67 | 814, 68 | 831, 69 | 837, 70 | 848, 71 | 862, 72 | 864, 73 | 886, 74 | 890, 75 | 894, 76 | 906, 77 | 938, 78 | 942, 79 | 948, 80 | 956, 81 | 985, 82 | 992, 83 | 1007, 84 | 1009, 85 | 1010, 86 | 1019, 87 | 1031, 88 | 1040, 89 | 1043, 90 | 1067, 91 | 1068, 92 | 1081, 93 | 1090, 94 | 1094, 95 | 1112, 96 | 1114, 97 | 1137, 98 | 1141, 99 | 1154, 100 | 1163, 101 | 1169, 102 | 1173, 103 | 1183, 104 | 1184, 105 | 1186, 106 | 1188, 107 | 1202, 108 | 1205, 109 | 1227, 110 | 1241, 111 | 1247, 112 | 1269, 113 | 1271, 114 | 1290, 115 | 1292, 116 | 1297, 117 | 1311, 118 | 1326, 119 | 1361, 120 | 1363, 121 | 1364, 122 | 1376, 123 | 1439, 124 | 1456, 125 | 1472, 126 | 1482, 127 | 1489, 128 | 1503, 129 | 1507, 130 | 1519, 131 | 1527, 132 | 1528, 133 | 1567, 134 | 1574, 135 | 1577, 136 | 1584, 137 | 1585, 138 | 1588, 139 | 1591, 140 | 1612, 141 | 1616, 142 | 1620, 143 | 1622, 144 | 1625, 145 | 1627, 146 | 1632, 147 | 1664, 148 | 1667, 149 | 1676, 150 | 1690, 151 | 1715, 152 | 1723, 153 | 1729, 154 | 1747, 155 | 1751, 156 | 1754, 157 | 1757, 158 | 1758, 159 | 1760, 160 | 1767, 161 | 1771, 162 | 1777, 163 | 1787, 164 | 1799, 165 | 1808, 166 | 1817, 167 | 1822, 168 | 1832, 169 | 1833, 170 | 1839, 171 | 1850, 172 | 1851, 173 | 1855, 174 | 1902, 175 | 1905, 176 | 1907, 177 | 1919, 178 | 1921, 179 | 1948, 180 | 1949, 181 | 1956, 182 | 1959, 183 | 1962, 184 | 1965, 185 | 1980, 186 | 1986, 187 | 1994, 188 | 2010, 189 | 2011, 190 | 2024, 191 | 2055, 192 | 2057, 193 | 2069, 194 | 2074, 195 | 2080, 196 | 2095, 197 | 2132, 198 | 2135, 199 | 2146, 200 | 2159, 201 | 2175, 202 | 2235, 203 | 2238, 204 | 2245, 205 | 2282, 206 | 2283, 207 | 2331, 208 | 2334, 209 | 2346, 210 | 2349, 211 | 2355, 212 | 2394, 213 | 2398, 214 | 2406 215 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 9, 4 | 11, 5 | 17, 6 | 24, 7 | 59, 8 | 62, 9 | 67, 10 | 69, 11 | 80, 12 | 99, 13 | 105, 14 | 136, 15 | 154, 16 | 156, 17 | 189, 18 | 190, 19 | 200, 20 | 233 21 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 10, 3 | 14, 4 | 23, 5 | 25, 6 | 37, 7 | 38, 8 | 57, 9 | 61, 10 | 71, 11 | 79, 12 | 92, 13 | 94, 14 | 107, 15 | 112, 16 | 137, 17 | 155, 18 | 181, 19 | 192, 20 | 199, 21 | 206, 22 | 238, 23 | 240, 24 | 253, 25 | 255, 26 | 259, 27 | 264 28 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 8, 4 | 22, 5 | 26, 6 | 30, 7 | 43, 8 | 48, 9 | 50, 10 | 96, 11 | 103, 12 | 111, 13 | 115, 14 | 131, 15 | 139, 16 | 140, 17 | 141, 18 | 142, 19 | 166, 20 | 170, 21 | 172, 22 | 180, 23 | 182, 24 | 194, 25 | 224, 26 | 234, 27 | 241, 28 | 244, 29 | 254, 30 | 265 31 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 29, 3 | 40, 4 | 46, 5 | 53, 6 | 65, 7 | 82, 8 | 88, 9 | 90, 10 | 93, 11 | 97, 12 | 98, 13 | 123, 14 | 165, 15 | 171, 16 | 198, 17 | 205, 18 | 228, 19 | 229, 20 | 232, 21 | 235, 22 | 256, 23 | 263, 24 | 268 25 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 4, 3 | 27, 4 | 49, 5 | 83, 6 | 84, 7 | 85, 8 | 89, 9 | 104, 10 | 119, 11 | 149, 12 | 151, 13 | 168, 14 | 173, 15 | 185, 16 | 187, 17 | 196, 18 | 201, 19 | 212, 20 | 221, 21 | 227, 22 | 231, 23 | 237, 24 | 239, 25 | 245, 26 | 249, 27 | 251 28 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 16, 4 | 41, 5 | 42, 6 | 47, 7 | 51, 8 | 52, 9 | 58, 10 | 60, 11 | 64, 12 | 66, 13 | 70, 14 | 73, 15 | 77, 16 | 91, 17 | 95, 18 | 109, 19 | 113, 20 | 116, 21 | 130, 22 | 132, 23 | 138, 24 | 146, 25 | 147, 26 | 157, 27 | 175, 28 | 191, 29 | 197, 30 | 209, 31 | 211, 32 | 213, 33 | 215, 34 | 220, 35 | 246, 36 | 257, 37 | 258, 38 | 260, 39 | 267 40 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 7, 4 | 19, 5 | 33, 6 | 44, 7 | 45, 8 | 55, 9 | 75, 10 | 81, 11 | 127, 12 | 133, 13 | 143, 14 | 150, 15 | 152, 16 | 159, 17 | 160, 18 | 161, 19 | 163, 20 | 177, 21 | 184, 22 | 214, 23 | 219, 24 | 222, 25 | 236, 26 | 247 27 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 12, 3 | 18, 4 | 21, 5 | 32, 6 | 34, 7 | 39, 8 | 63, 9 | 76, 10 | 87, 11 | 100, 12 | 117, 13 | 120, 14 | 124, 15 | 125, 16 | 145, 17 | 153, 18 | 167, 19 | 176, 20 | 179, 21 | 183, 22 | 188, 23 | 195, 24 | 207, 25 | 208, 26 | 210, 27 | 226, 28 | 243 29 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 5, 4 | 15, 5 | 20, 6 | 31, 7 | 35, 8 | 54, 9 | 68, 10 | 72, 11 | 102, 12 | 108, 13 | 126, 14 | 128, 15 | 135, 16 | 164, 17 | 178, 18 | 202, 19 | 203, 20 | 217, 21 | 230, 22 | 252, 23 | 266 24 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/bibliotik/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 13, 3 | 28, 4 | 36, 5 | 56, 6 | 74, 7 | 78, 8 | 86, 9 | 101, 10 | 106, 11 | 110, 12 | 114, 13 | 118, 14 | 121, 15 | 122, 16 | 129, 17 | 134, 18 | 144, 19 | 148, 20 | 158, 21 | 162, 22 | 169, 23 | 174, 24 | 186, 25 | 193, 26 | 204, 27 | 216, 28 | 218, 29 | 223, 30 | 225, 31 | 242, 32 | 248, 33 | 250, 34 | 261, 35 | 262 36 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 4, 3 | 12, 4 | 20, 5 | 33, 6 | 34, 7 | 40, 8 | 58, 9 | 70, 10 | 77, 11 | 100, 12 | 111, 13 | 120, 14 | 121, 15 | 126, 16 | 134, 17 | 171, 18 | 205, 19 | 232, 20 | 252, 21 | 260, 22 | 263, 23 | 264, 24 | 280, 25 | 296, 26 | 302, 27 | 323, 28 | 345, 29 | 347, 30 | 361, 31 | 379, 32 | 391, 33 | 399, 34 | 412, 35 | 427, 36 | 430, 37 | 441, 38 | 452, 39 | 455, 40 | 480, 41 | 500, 42 | 501, 43 | 518, 44 | 525, 45 | 527, 46 | 538, 47 | 542, 48 | 543, 49 | 553, 50 | 563, 51 | 582, 52 | 588, 53 | 601, 54 | 612, 55 | 614, 56 | 650, 57 | 674, 58 | 693, 59 | 696, 60 | 702, 61 | 713, 62 | 714, 63 | 715, 64 | 718, 65 | 737, 66 | 750, 67 | 767, 68 | 771, 69 | 781, 70 | 792, 71 | 809, 72 | 814, 73 | 821, 74 | 841, 75 | 863, 76 | 881, 77 | 883, 78 | 888, 79 | 892, 80 | 896, 81 | 899, 82 | 917, 83 | 929, 84 | 942, 85 | 954, 86 | 956, 87 | 965, 88 | 977, 89 | 980, 90 | 981, 91 | 987, 92 | 988, 93 | 1001, 94 | 1007, 95 | 1008, 96 | 1009, 97 | 1021, 98 | 1055, 99 | 1062, 100 | 1083, 101 | 1089, 102 | 1091, 103 | 1108, 104 | 1125, 105 | 1146, 106 | 1151, 107 | 1162, 108 | 1167, 109 | 1192, 110 | 1195, 111 | 1197, 112 | 1216, 113 | 1217, 114 | 1239, 115 | 1241, 116 | 1245, 117 | 1249, 118 | 1254, 119 | 1266, 120 | 1268, 121 | 1276, 122 | 1297, 123 | 1311, 124 | 1320, 125 | 1328, 126 | 1342, 127 | 1350, 128 | 1353, 129 | 1378, 130 | 1399, 131 | 1404, 132 | 1417, 133 | 1435, 134 | 1455, 135 | 1456, 136 | 1458, 137 | 1468, 138 | 1475, 139 | 1484, 140 | 1488, 141 | 1491, 142 | 1512, 143 | 1525, 144 | 1530, 145 | 1535, 146 | 1536, 147 | 1554, 148 | 1557, 149 | 1562, 150 | 1578, 151 | 1585, 152 | 1603, 153 | 1612, 154 | 1619, 155 | 1625, 156 | 1628, 157 | 1629, 158 | 1634, 159 | 1644, 160 | 1653, 161 | 1668, 162 | 1674, 163 | 1682, 164 | 1698, 165 | 1707, 166 | 1709, 167 | 1744, 168 | 1751, 169 | 1760, 170 | 1776, 171 | 1784, 172 | 1792, 173 | 1795, 174 | 1806, 175 | 1807, 176 | 1816, 177 | 1817, 178 | 1828, 179 | 1829, 180 | 1833, 181 | 1839, 182 | 1853, 183 | 1871, 184 | 1900, 185 | 1910, 186 | 1914, 187 | 1921 188 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 21, 3 | 36, 4 | 42, 5 | 50, 6 | 57, 7 | 59, 8 | 61, 9 | 63, 10 | 64, 11 | 65, 12 | 82, 13 | 90, 14 | 91, 15 | 97, 16 | 103, 17 | 104, 18 | 113, 19 | 122, 20 | 124, 21 | 127, 22 | 137, 23 | 152, 24 | 176, 25 | 195, 26 | 199, 27 | 200, 28 | 204, 29 | 207, 30 | 214, 31 | 217, 32 | 230, 33 | 246, 34 | 253, 35 | 262, 36 | 266, 37 | 273, 38 | 282, 39 | 294, 40 | 299, 41 | 300, 42 | 317, 43 | 327, 44 | 334, 45 | 335, 46 | 337, 47 | 338, 48 | 343, 49 | 383, 50 | 408, 51 | 423, 52 | 424, 53 | 456, 54 | 457, 55 | 460, 56 | 470, 57 | 493, 58 | 496, 59 | 520, 60 | 526, 61 | 528, 62 | 529, 63 | 536, 64 | 548, 65 | 549, 66 | 555, 67 | 580, 68 | 607, 69 | 622, 70 | 638, 71 | 642, 72 | 657, 73 | 661, 74 | 680, 75 | 683, 76 | 711, 77 | 723, 78 | 725, 79 | 756, 80 | 760, 81 | 764, 82 | 765, 83 | 776, 84 | 782, 85 | 793, 86 | 806, 87 | 817, 88 | 830, 89 | 845, 90 | 865, 91 | 872, 92 | 874, 93 | 879, 94 | 886, 95 | 915, 96 | 918, 97 | 921, 98 | 922, 99 | 932, 100 | 959, 101 | 975, 102 | 978, 103 | 993, 104 | 1005, 105 | 1014, 106 | 1026, 107 | 1047, 108 | 1052, 109 | 1066, 110 | 1082, 111 | 1087, 112 | 1128, 113 | 1130, 114 | 1131, 115 | 1147, 116 | 1148, 117 | 1158, 118 | 1160, 119 | 1179, 120 | 1198, 121 | 1207, 122 | 1225, 123 | 1230, 124 | 1231, 125 | 1244, 126 | 1259, 127 | 1272, 128 | 1279, 129 | 1299, 130 | 1306, 131 | 1338, 132 | 1343, 133 | 1365, 134 | 1379, 135 | 1387, 136 | 1388, 137 | 1405, 138 | 1412, 139 | 1420, 140 | 1426, 141 | 1443, 142 | 1446, 143 | 1461, 144 | 1469, 145 | 1472, 146 | 1485, 147 | 1496, 148 | 1497, 149 | 1516, 150 | 1521, 151 | 1544, 152 | 1551, 153 | 1556, 154 | 1560, 155 | 1569, 156 | 1571, 157 | 1584, 158 | 1596, 159 | 1597, 160 | 1604, 161 | 1616, 162 | 1638, 163 | 1639, 164 | 1665, 165 | 1666, 166 | 1712, 167 | 1716, 168 | 1726, 169 | 1748, 170 | 1752, 171 | 1757, 172 | 1758, 173 | 1775, 174 | 1785, 175 | 1802, 176 | 1815, 177 | 1827, 178 | 1834, 179 | 1859, 180 | 1861, 181 | 1875, 182 | 1876, 183 | 1881, 184 | 1893, 185 | 1913 186 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 22, 3 | 46, 4 | 56, 5 | 68, 6 | 80, 7 | 99, 8 | 107, 9 | 108, 10 | 114, 11 | 115, 12 | 128, 13 | 155, 14 | 160, 15 | 161, 16 | 170, 17 | 188, 18 | 192, 19 | 202, 20 | 240, 21 | 248, 22 | 250, 23 | 251, 24 | 275, 25 | 308, 26 | 309, 27 | 315, 28 | 316, 29 | 322, 30 | 332, 31 | 333, 32 | 339, 33 | 344, 34 | 351, 35 | 354, 36 | 355, 37 | 359, 38 | 362, 39 | 370, 40 | 389, 41 | 398, 42 | 402, 43 | 405, 44 | 407, 45 | 409, 46 | 411, 47 | 440, 48 | 453, 49 | 474, 50 | 484, 51 | 505, 52 | 508, 53 | 511, 54 | 516, 55 | 522, 56 | 523, 57 | 557, 58 | 564, 59 | 572, 60 | 578, 61 | 596, 62 | 616, 63 | 627, 64 | 632, 65 | 633, 66 | 648, 67 | 651, 68 | 653, 69 | 658, 70 | 677, 71 | 684, 72 | 695, 73 | 704, 74 | 720, 75 | 730, 76 | 734, 77 | 738, 78 | 755, 79 | 773, 80 | 778, 81 | 804, 82 | 805, 83 | 808, 84 | 810, 85 | 822, 86 | 839, 87 | 852, 88 | 861, 89 | 875, 90 | 885, 91 | 960, 92 | 969, 93 | 979, 94 | 992, 95 | 996, 96 | 999, 97 | 1000, 98 | 1006, 99 | 1046, 100 | 1061, 101 | 1077, 102 | 1078, 103 | 1081, 104 | 1097, 105 | 1132, 106 | 1140, 107 | 1171, 108 | 1172, 109 | 1185, 110 | 1193, 111 | 1201, 112 | 1208, 113 | 1233, 114 | 1261, 115 | 1270, 116 | 1278, 117 | 1286, 118 | 1290, 119 | 1291, 120 | 1309, 121 | 1310, 122 | 1329, 123 | 1340, 124 | 1341, 125 | 1347, 126 | 1349, 127 | 1356, 128 | 1367, 129 | 1371, 130 | 1402, 131 | 1408, 132 | 1419, 133 | 1427, 134 | 1431, 135 | 1440, 136 | 1444, 137 | 1462, 138 | 1466, 139 | 1487, 140 | 1505, 141 | 1548, 142 | 1550, 143 | 1552, 144 | 1564, 145 | 1594, 146 | 1605, 147 | 1642, 148 | 1646, 149 | 1650, 150 | 1659, 151 | 1669, 152 | 1670, 153 | 1671, 154 | 1683, 155 | 1693, 156 | 1702, 157 | 1708, 158 | 1728, 159 | 1743, 160 | 1763, 161 | 1772, 162 | 1788, 163 | 1793, 164 | 1803, 165 | 1813, 166 | 1824, 167 | 1837, 168 | 1846, 169 | 1858, 170 | 1906, 171 | 1917, 172 | 1920 173 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 11, 4 | 19, 5 | 32, 6 | 51, 7 | 60, 8 | 87, 9 | 116, 10 | 139, 11 | 140, 12 | 142, 13 | 146, 14 | 147, 15 | 150, 16 | 158, 17 | 162, 18 | 172, 19 | 173, 20 | 179, 21 | 212, 22 | 213, 23 | 219, 24 | 225, 25 | 229, 26 | 234, 27 | 241, 28 | 257, 29 | 261, 30 | 270, 31 | 272, 32 | 277, 33 | 292, 34 | 295, 35 | 297, 36 | 324, 37 | 329, 38 | 357, 39 | 358, 40 | 366, 41 | 375, 42 | 390, 43 | 395, 44 | 414, 45 | 418, 46 | 435, 47 | 467, 48 | 469, 49 | 471, 50 | 477, 51 | 486, 52 | 488, 53 | 495, 54 | 506, 55 | 519, 56 | 524, 57 | 537, 58 | 568, 59 | 570, 60 | 571, 61 | 573, 62 | 585, 63 | 587, 64 | 595, 65 | 597, 66 | 609, 67 | 617, 68 | 645, 69 | 666, 70 | 669, 71 | 673, 72 | 676, 73 | 706, 74 | 716, 75 | 719, 76 | 721, 77 | 722, 78 | 732, 79 | 733, 80 | 735, 81 | 739, 82 | 749, 83 | 752, 84 | 770, 85 | 787, 86 | 811, 87 | 812, 88 | 823, 89 | 824, 90 | 829, 91 | 833, 92 | 835, 93 | 842, 94 | 846, 95 | 855, 96 | 856, 97 | 868, 98 | 871, 99 | 878, 100 | 891, 101 | 901, 102 | 904, 103 | 907, 104 | 910, 105 | 916, 106 | 939, 107 | 947, 108 | 971, 109 | 982, 110 | 983, 111 | 991, 112 | 998, 113 | 1004, 114 | 1024, 115 | 1036, 116 | 1040, 117 | 1048, 118 | 1060, 119 | 1067, 120 | 1072, 121 | 1075, 122 | 1084, 123 | 1088, 124 | 1093, 125 | 1098, 126 | 1103, 127 | 1106, 128 | 1107, 129 | 1110, 130 | 1118, 131 | 1165, 132 | 1174, 133 | 1182, 134 | 1191, 135 | 1218, 136 | 1247, 137 | 1250, 138 | 1257, 139 | 1281, 140 | 1284, 141 | 1314, 142 | 1335, 143 | 1355, 144 | 1372, 145 | 1377, 146 | 1386, 147 | 1397, 148 | 1406, 149 | 1410, 150 | 1411, 151 | 1415, 152 | 1441, 153 | 1445, 154 | 1448, 155 | 1459, 156 | 1460, 157 | 1480, 158 | 1489, 159 | 1493, 160 | 1495, 161 | 1499, 162 | 1500, 163 | 1503, 164 | 1513, 165 | 1520, 166 | 1524, 167 | 1528, 168 | 1538, 169 | 1545, 170 | 1549, 171 | 1561, 172 | 1566, 173 | 1593, 174 | 1623, 175 | 1643, 176 | 1654, 177 | 1655, 178 | 1657, 179 | 1678, 180 | 1697, 181 | 1705, 182 | 1725, 183 | 1737, 184 | 1745, 185 | 1749, 186 | 1755, 187 | 1773, 188 | 1777, 189 | 1789, 190 | 1809, 191 | 1810, 192 | 1838, 193 | 1840, 194 | 1844, 195 | 1852, 196 | 1855, 197 | 1868, 198 | 1869, 199 | 1895, 200 | 1896, 201 | 1908 202 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 13, 4 | 18, 5 | 23, 6 | 27, 7 | 35, 8 | 54, 9 | 83, 10 | 88, 11 | 93, 12 | 112, 13 | 119, 14 | 130, 15 | 135, 16 | 141, 17 | 157, 18 | 159, 19 | 165, 20 | 167, 21 | 174, 22 | 177, 23 | 180, 24 | 187, 25 | 193, 26 | 223, 27 | 228, 28 | 244, 29 | 265, 30 | 287, 31 | 298, 32 | 307, 33 | 319, 34 | 356, 35 | 376, 36 | 387, 37 | 392, 38 | 394, 39 | 396, 40 | 404, 41 | 415, 42 | 432, 43 | 433, 44 | 437, 45 | 438, 46 | 446, 47 | 482, 48 | 492, 49 | 507, 50 | 510, 51 | 535, 52 | 546, 53 | 552, 54 | 556, 55 | 559, 56 | 575, 57 | 581, 58 | 605, 59 | 606, 60 | 629, 61 | 630, 62 | 631, 63 | 668, 64 | 688, 65 | 689, 66 | 694, 67 | 712, 68 | 742, 69 | 745, 70 | 757, 71 | 758, 72 | 768, 73 | 772, 74 | 779, 75 | 791, 76 | 803, 77 | 816, 78 | 820, 79 | 831, 80 | 840, 81 | 844, 82 | 851, 83 | 860, 84 | 866, 85 | 898, 86 | 903, 87 | 905, 88 | 911, 89 | 919, 90 | 931, 91 | 935, 92 | 953, 93 | 955, 94 | 967, 95 | 968, 96 | 985, 97 | 997, 98 | 1003, 99 | 1013, 100 | 1016, 101 | 1018, 102 | 1045, 103 | 1050, 104 | 1057, 105 | 1094, 106 | 1096, 107 | 1111, 108 | 1112, 109 | 1154, 110 | 1155, 111 | 1161, 112 | 1163, 113 | 1170, 114 | 1175, 115 | 1176, 116 | 1183, 117 | 1194, 118 | 1199, 119 | 1200, 120 | 1203, 121 | 1221, 122 | 1226, 123 | 1236, 124 | 1237, 125 | 1238, 126 | 1274, 127 | 1277, 128 | 1285, 129 | 1289, 130 | 1301, 131 | 1303, 132 | 1318, 133 | 1321, 134 | 1332, 135 | 1354, 136 | 1357, 137 | 1359, 138 | 1368, 139 | 1381, 140 | 1385, 141 | 1391, 142 | 1395, 143 | 1439, 144 | 1449, 145 | 1453, 146 | 1454, 147 | 1490, 148 | 1504, 149 | 1518, 150 | 1542, 151 | 1543, 152 | 1559, 153 | 1567, 154 | 1586, 155 | 1601, 156 | 1602, 157 | 1609, 158 | 1610, 159 | 1618, 160 | 1620, 161 | 1630, 162 | 1645, 163 | 1651, 164 | 1658, 165 | 1660, 166 | 1662, 167 | 1672, 168 | 1673, 169 | 1677, 170 | 1715, 171 | 1733, 172 | 1766, 173 | 1768, 174 | 1769, 175 | 1787, 176 | 1791, 177 | 1796, 178 | 1812, 179 | 1835, 180 | 1856, 181 | 1860, 182 | 1863, 183 | 1872, 184 | 1874, 185 | 1889, 186 | 1898, 187 | 1905, 188 | 1912 189 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 7, 3 | 14, 4 | 25, 5 | 37, 6 | 39, 7 | 53, 8 | 67, 9 | 71, 10 | 86, 11 | 92, 12 | 96, 13 | 149, 14 | 151, 15 | 156, 16 | 178, 17 | 184, 18 | 206, 19 | 220, 20 | 221, 21 | 236, 22 | 238, 23 | 245, 24 | 255, 25 | 258, 26 | 274, 27 | 281, 28 | 283, 29 | 288, 30 | 303, 31 | 306, 32 | 312, 33 | 318, 34 | 321, 35 | 325, 36 | 350, 37 | 352, 38 | 360, 39 | 369, 40 | 374, 41 | 378, 42 | 386, 43 | 393, 44 | 400, 45 | 420, 46 | 436, 47 | 442, 48 | 445, 49 | 448, 50 | 462, 51 | 475, 52 | 479, 53 | 481, 54 | 483, 55 | 490, 56 | 534, 57 | 540, 58 | 560, 59 | 567, 60 | 584, 61 | 590, 62 | 592, 63 | 603, 64 | 613, 65 | 628, 66 | 635, 67 | 641, 68 | 643, 69 | 647, 70 | 654, 71 | 660, 72 | 670, 73 | 675, 74 | 681, 75 | 697, 76 | 710, 77 | 748, 78 | 751, 79 | 761, 80 | 775, 81 | 780, 82 | 786, 83 | 790, 84 | 800, 85 | 802, 86 | 819, 87 | 825, 88 | 832, 89 | 838, 90 | 854, 91 | 857, 92 | 858, 93 | 862, 94 | 864, 95 | 877, 96 | 882, 97 | 893, 98 | 895, 99 | 913, 100 | 914, 101 | 928, 102 | 958, 103 | 961, 104 | 976, 105 | 990, 106 | 1011, 107 | 1015, 108 | 1020, 109 | 1022, 110 | 1032, 111 | 1034, 112 | 1039, 113 | 1051, 114 | 1063, 115 | 1070, 116 | 1076, 117 | 1080, 118 | 1090, 119 | 1092, 120 | 1116, 121 | 1117, 122 | 1121, 123 | 1126, 124 | 1137, 125 | 1143, 126 | 1153, 127 | 1157, 128 | 1189, 129 | 1209, 130 | 1222, 131 | 1240, 132 | 1242, 133 | 1246, 134 | 1251, 135 | 1252, 136 | 1255, 137 | 1260, 138 | 1263, 139 | 1287, 140 | 1292, 141 | 1300, 142 | 1304, 143 | 1313, 144 | 1334, 145 | 1344, 146 | 1362, 147 | 1363, 148 | 1373, 149 | 1390, 150 | 1421, 151 | 1424, 152 | 1425, 153 | 1438, 154 | 1450, 155 | 1467, 156 | 1470, 157 | 1479, 158 | 1481, 159 | 1494, 160 | 1511, 161 | 1534, 162 | 1539, 163 | 1574, 164 | 1575, 165 | 1583, 166 | 1587, 167 | 1590, 168 | 1599, 169 | 1608, 170 | 1613, 171 | 1621, 172 | 1633, 173 | 1635, 174 | 1640, 175 | 1667, 176 | 1679, 177 | 1681, 178 | 1685, 179 | 1686, 180 | 1688, 181 | 1696, 182 | 1706, 183 | 1711, 184 | 1713, 185 | 1717, 186 | 1718, 187 | 1719, 188 | 1722, 189 | 1727, 190 | 1739, 191 | 1740, 192 | 1741, 193 | 1750, 194 | 1753, 195 | 1756, 196 | 1762, 197 | 1780, 198 | 1781, 199 | 1786, 200 | 1790, 201 | 1821, 202 | 1825, 203 | 1830, 204 | 1862, 205 | 1864, 206 | 1867, 207 | 1870, 208 | 1877, 209 | 1882, 210 | 1883, 211 | 1890, 212 | 1911 213 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 5, 4 | 8, 5 | 28, 6 | 29, 7 | 38, 8 | 47, 9 | 48, 10 | 72, 11 | 73, 12 | 94, 13 | 95, 14 | 102, 15 | 118, 16 | 132, 17 | 144, 18 | 189, 19 | 216, 20 | 227, 21 | 235, 22 | 237, 23 | 243, 24 | 249, 25 | 256, 26 | 268, 27 | 271, 28 | 284, 29 | 310, 30 | 314, 31 | 340, 32 | 342, 33 | 346, 34 | 348, 35 | 363, 36 | 365, 37 | 368, 38 | 371, 39 | 380, 40 | 388, 41 | 403, 42 | 459, 43 | 465, 44 | 466, 45 | 472, 46 | 498, 47 | 503, 48 | 512, 49 | 513, 50 | 551, 51 | 554, 52 | 569, 53 | 574, 54 | 618, 55 | 623, 56 | 639, 57 | 663, 58 | 664, 59 | 665, 60 | 672, 61 | 679, 62 | 698, 63 | 708, 64 | 717, 65 | 741, 66 | 747, 67 | 762, 68 | 783, 69 | 785, 70 | 796, 71 | 799, 72 | 807, 73 | 828, 74 | 847, 75 | 853, 76 | 876, 77 | 894, 78 | 900, 79 | 924, 80 | 925, 81 | 926, 82 | 927, 83 | 930, 84 | 933, 85 | 936, 86 | 937, 87 | 945, 88 | 949, 89 | 963, 90 | 984, 91 | 986, 92 | 1017, 93 | 1033, 94 | 1038, 95 | 1041, 96 | 1042, 97 | 1043, 98 | 1049, 99 | 1056, 100 | 1086, 101 | 1100, 102 | 1109, 103 | 1119, 104 | 1120, 105 | 1123, 106 | 1138, 107 | 1141, 108 | 1204, 109 | 1210, 110 | 1215, 111 | 1220, 112 | 1227, 113 | 1229, 114 | 1234, 115 | 1256, 116 | 1262, 117 | 1282, 118 | 1288, 119 | 1302, 120 | 1305, 121 | 1315, 122 | 1317, 123 | 1319, 124 | 1324, 125 | 1326, 126 | 1331, 127 | 1348, 128 | 1351, 129 | 1358, 130 | 1360, 131 | 1369, 132 | 1374, 133 | 1382, 134 | 1389, 135 | 1409, 136 | 1433, 137 | 1434, 138 | 1436, 139 | 1437, 140 | 1465, 141 | 1477, 142 | 1482, 143 | 1502, 144 | 1509, 145 | 1517, 146 | 1526, 147 | 1529, 148 | 1537, 149 | 1547, 150 | 1555, 151 | 1568, 152 | 1572, 153 | 1573, 154 | 1579, 155 | 1582, 156 | 1591, 157 | 1598, 158 | 1607, 159 | 1611, 160 | 1622, 161 | 1636, 162 | 1664, 163 | 1695, 164 | 1700, 165 | 1701, 166 | 1704, 167 | 1710, 168 | 1714, 169 | 1723, 170 | 1724, 171 | 1747, 172 | 1759, 173 | 1765, 174 | 1774, 175 | 1778, 176 | 1799, 177 | 1808, 178 | 1818, 179 | 1820, 180 | 1826, 181 | 1841, 182 | 1842, 183 | 1843, 184 | 1848, 185 | 1849, 186 | 1857, 187 | 1865, 188 | 1880, 189 | 1886, 190 | 1891, 191 | 1901 192 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 10, 4 | 17, 5 | 26, 6 | 30, 7 | 41, 8 | 44, 9 | 49, 10 | 76, 11 | 79, 12 | 84, 13 | 89, 14 | 98, 15 | 101, 16 | 125, 17 | 133, 18 | 136, 19 | 145, 20 | 186, 21 | 190, 22 | 197, 23 | 208, 24 | 210, 25 | 222, 26 | 224, 27 | 247, 28 | 254, 29 | 259, 30 | 269, 31 | 278, 32 | 279, 33 | 285, 34 | 304, 35 | 305, 36 | 311, 37 | 328, 38 | 331, 39 | 341, 40 | 372, 41 | 397, 42 | 401, 43 | 419, 44 | 421, 45 | 425, 46 | 429, 47 | 434, 48 | 439, 49 | 447, 50 | 450, 51 | 461, 52 | 464, 53 | 468, 54 | 473, 55 | 476, 56 | 478, 57 | 487, 58 | 499, 59 | 502, 60 | 509, 61 | 531, 62 | 544, 63 | 547, 64 | 562, 65 | 579, 66 | 583, 67 | 589, 68 | 598, 69 | 599, 70 | 604, 71 | 615, 72 | 624, 73 | 625, 74 | 636, 75 | 649, 76 | 726, 77 | 727, 78 | 731, 79 | 743, 80 | 766, 81 | 777, 82 | 788, 83 | 815, 84 | 818, 85 | 834, 86 | 836, 87 | 843, 88 | 849, 89 | 897, 90 | 902, 91 | 908, 92 | 923, 93 | 941, 94 | 943, 95 | 946, 96 | 948, 97 | 966, 98 | 974, 99 | 989, 100 | 994, 101 | 1019, 102 | 1035, 103 | 1058, 104 | 1064, 105 | 1065, 106 | 1068, 107 | 1069, 108 | 1071, 109 | 1074, 110 | 1099, 111 | 1101, 112 | 1102, 113 | 1104, 114 | 1113, 115 | 1114, 116 | 1115, 117 | 1127, 118 | 1144, 119 | 1152, 120 | 1159, 121 | 1177, 122 | 1178, 123 | 1184, 124 | 1188, 125 | 1196, 126 | 1205, 127 | 1213, 128 | 1214, 129 | 1228, 130 | 1235, 131 | 1243, 132 | 1253, 133 | 1258, 134 | 1264, 135 | 1267, 136 | 1280, 137 | 1298, 138 | 1316, 139 | 1325, 140 | 1330, 141 | 1333, 142 | 1339, 143 | 1364, 144 | 1366, 145 | 1375, 146 | 1394, 147 | 1400, 148 | 1418, 149 | 1429, 150 | 1447, 151 | 1464, 152 | 1471, 153 | 1473, 154 | 1474, 155 | 1483, 156 | 1486, 157 | 1492, 158 | 1501, 159 | 1506, 160 | 1508, 161 | 1514, 162 | 1519, 163 | 1527, 164 | 1533, 165 | 1540, 166 | 1541, 167 | 1558, 168 | 1563, 169 | 1570, 170 | 1576, 171 | 1592, 172 | 1615, 173 | 1624, 174 | 1632, 175 | 1637, 176 | 1648, 177 | 1652, 178 | 1656, 179 | 1661, 180 | 1675, 181 | 1687, 182 | 1691, 183 | 1692, 184 | 1729, 185 | 1731, 186 | 1732, 187 | 1736, 188 | 1767, 189 | 1771, 190 | 1779, 191 | 1797, 192 | 1805, 193 | 1814, 194 | 1822, 195 | 1823, 196 | 1866, 197 | 1873, 198 | 1899, 199 | 1907, 200 | 1909, 201 | 1918, 202 | 1919 203 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 16, 4 | 24, 5 | 31, 6 | 43, 7 | 45, 8 | 55, 9 | 62, 10 | 69, 11 | 74, 12 | 75, 13 | 78, 14 | 81, 15 | 105, 16 | 106, 17 | 109, 18 | 117, 19 | 123, 20 | 148, 21 | 153, 22 | 154, 23 | 164, 24 | 166, 25 | 183, 26 | 194, 27 | 196, 28 | 201, 29 | 209, 30 | 211, 31 | 215, 32 | 218, 33 | 226, 34 | 239, 35 | 242, 36 | 267, 37 | 276, 38 | 286, 39 | 291, 40 | 313, 41 | 326, 42 | 349, 43 | 353, 44 | 364, 45 | 377, 46 | 382, 47 | 384, 48 | 406, 49 | 413, 50 | 416, 51 | 422, 52 | 426, 53 | 444, 54 | 454, 55 | 463, 56 | 489, 57 | 497, 58 | 504, 59 | 514, 60 | 515, 61 | 521, 62 | 532, 63 | 533, 64 | 545, 65 | 558, 66 | 561, 67 | 565, 68 | 576, 69 | 586, 70 | 591, 71 | 593, 72 | 602, 73 | 608, 74 | 611, 75 | 619, 76 | 621, 77 | 626, 78 | 634, 79 | 644, 80 | 659, 81 | 667, 82 | 671, 83 | 678, 84 | 682, 85 | 685, 86 | 687, 87 | 690, 88 | 691, 89 | 699, 90 | 703, 91 | 705, 92 | 724, 93 | 728, 94 | 736, 95 | 740, 96 | 746, 97 | 754, 98 | 784, 99 | 789, 100 | 795, 101 | 797, 102 | 798, 103 | 801, 104 | 813, 105 | 826, 106 | 837, 107 | 867, 108 | 870, 109 | 880, 110 | 884, 111 | 889, 112 | 890, 113 | 906, 114 | 909, 115 | 912, 116 | 934, 117 | 944, 118 | 951, 119 | 957, 120 | 964, 121 | 970, 122 | 972, 123 | 995, 124 | 1012, 125 | 1023, 126 | 1028, 127 | 1029, 128 | 1031, 129 | 1054, 130 | 1073, 131 | 1079, 132 | 1135, 133 | 1139, 134 | 1166, 135 | 1173, 136 | 1181, 137 | 1190, 138 | 1212, 139 | 1269, 140 | 1271, 141 | 1275, 142 | 1283, 143 | 1294, 144 | 1296, 145 | 1307, 146 | 1322, 147 | 1327, 148 | 1336, 149 | 1345, 150 | 1370, 151 | 1376, 152 | 1383, 153 | 1384, 154 | 1392, 155 | 1393, 156 | 1396, 157 | 1403, 158 | 1413, 159 | 1428, 160 | 1432, 161 | 1451, 162 | 1452, 163 | 1476, 164 | 1498, 165 | 1507, 166 | 1510, 167 | 1515, 168 | 1531, 169 | 1546, 170 | 1565, 171 | 1577, 172 | 1581, 173 | 1589, 174 | 1595, 175 | 1606, 176 | 1614, 177 | 1626, 178 | 1627, 179 | 1631, 180 | 1641, 181 | 1649, 182 | 1680, 183 | 1689, 184 | 1690, 185 | 1699, 186 | 1720, 187 | 1730, 188 | 1735, 189 | 1738, 190 | 1742, 191 | 1746, 192 | 1754, 193 | 1761, 194 | 1782, 195 | 1800, 196 | 1811, 197 | 1819, 198 | 1831, 199 | 1845, 200 | 1851, 201 | 1879, 202 | 1897, 203 | 1903, 204 | 1915, 205 | 1916 206 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/dm-mathematics/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 15, 4 | 52, 5 | 66, 6 | 85, 7 | 110, 8 | 129, 9 | 131, 10 | 138, 11 | 143, 12 | 163, 13 | 168, 14 | 169, 15 | 175, 16 | 181, 17 | 182, 18 | 185, 19 | 191, 20 | 198, 21 | 203, 22 | 231, 23 | 233, 24 | 289, 25 | 290, 26 | 293, 27 | 301, 28 | 320, 29 | 330, 30 | 336, 31 | 367, 32 | 373, 33 | 381, 34 | 385, 35 | 410, 36 | 417, 37 | 428, 38 | 431, 39 | 443, 40 | 449, 41 | 451, 42 | 458, 43 | 485, 44 | 491, 45 | 494, 46 | 517, 47 | 530, 48 | 539, 49 | 541, 50 | 550, 51 | 566, 52 | 577, 53 | 594, 54 | 600, 55 | 610, 56 | 620, 57 | 637, 58 | 640, 59 | 646, 60 | 652, 61 | 655, 62 | 656, 63 | 662, 64 | 686, 65 | 692, 66 | 700, 67 | 701, 68 | 707, 69 | 709, 70 | 729, 71 | 744, 72 | 753, 73 | 759, 74 | 763, 75 | 769, 76 | 774, 77 | 794, 78 | 827, 79 | 848, 80 | 850, 81 | 859, 82 | 869, 83 | 873, 84 | 887, 85 | 920, 86 | 938, 87 | 940, 88 | 950, 89 | 952, 90 | 962, 91 | 973, 92 | 1002, 93 | 1010, 94 | 1025, 95 | 1027, 96 | 1030, 97 | 1037, 98 | 1044, 99 | 1053, 100 | 1059, 101 | 1085, 102 | 1095, 103 | 1105, 104 | 1122, 105 | 1124, 106 | 1129, 107 | 1133, 108 | 1134, 109 | 1136, 110 | 1142, 111 | 1145, 112 | 1149, 113 | 1150, 114 | 1156, 115 | 1164, 116 | 1168, 117 | 1169, 118 | 1180, 119 | 1186, 120 | 1187, 121 | 1202, 122 | 1206, 123 | 1211, 124 | 1219, 125 | 1223, 126 | 1224, 127 | 1232, 128 | 1248, 129 | 1265, 130 | 1273, 131 | 1293, 132 | 1295, 133 | 1308, 134 | 1312, 135 | 1323, 136 | 1337, 137 | 1346, 138 | 1352, 139 | 1361, 140 | 1380, 141 | 1398, 142 | 1401, 143 | 1407, 144 | 1414, 145 | 1416, 146 | 1422, 147 | 1423, 148 | 1430, 149 | 1442, 150 | 1457, 151 | 1463, 152 | 1478, 153 | 1522, 154 | 1523, 155 | 1532, 156 | 1553, 157 | 1580, 158 | 1588, 159 | 1600, 160 | 1617, 161 | 1647, 162 | 1663, 163 | 1676, 164 | 1684, 165 | 1694, 166 | 1703, 167 | 1721, 168 | 1734, 169 | 1764, 170 | 1770, 171 | 1783, 172 | 1794, 173 | 1798, 174 | 1801, 175 | 1804, 176 | 1832, 177 | 1836, 178 | 1847, 179 | 1850, 180 | 1854, 181 | 1878, 182 | 1884, 183 | 1885, 184 | 1887, 185 | 1888, 186 | 1892, 187 | 1894, 188 | 1902, 189 | 1904 190 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 11, 4 | 32, 5 | 46, 6 | 52, 7 | 63, 8 | 82, 9 | 84, 10 | 88, 11 | 94, 12 | 96, 13 | 100, 14 | 101, 15 | 103, 16 | 108, 17 | 110, 18 | 112, 19 | 123, 20 | 136, 21 | 151, 22 | 172, 23 | 184, 24 | 198, 25 | 199, 26 | 227, 27 | 235, 28 | 236, 29 | 238, 30 | 244, 31 | 260, 32 | 262, 33 | 263, 34 | 271, 35 | 282, 36 | 288, 37 | 337, 38 | 343, 39 | 352, 40 | 361, 41 | 364, 42 | 376, 43 | 381, 44 | 384, 45 | 391, 46 | 399, 47 | 409, 48 | 416, 49 | 434, 50 | 435, 51 | 440, 52 | 454, 53 | 457, 54 | 461, 55 | 462, 56 | 474, 57 | 476, 58 | 478, 59 | 491, 60 | 494, 61 | 531, 62 | 535, 63 | 539, 64 | 544, 65 | 566, 66 | 568, 67 | 584, 68 | 627, 69 | 641, 70 | 642, 71 | 643, 72 | 669, 73 | 671, 74 | 687, 75 | 706, 76 | 713, 77 | 725, 78 | 750, 79 | 753, 80 | 763, 81 | 769, 82 | 774, 83 | 790, 84 | 795, 85 | 799, 86 | 816, 87 | 821, 88 | 830, 89 | 835, 90 | 840, 91 | 856, 92 | 866, 93 | 881, 94 | 910, 95 | 916, 96 | 917, 97 | 923, 98 | 941, 99 | 945, 100 | 969, 101 | 981, 102 | 989, 103 | 999 104 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 12, 3 | 18, 4 | 19, 5 | 38, 6 | 42, 7 | 53, 8 | 55, 9 | 72, 10 | 83, 11 | 85, 12 | 118, 13 | 134, 14 | 154, 15 | 168, 16 | 182, 17 | 183, 18 | 196, 19 | 200, 20 | 201, 21 | 203, 22 | 205, 23 | 206, 24 | 208, 25 | 248, 26 | 274, 27 | 279, 28 | 284, 29 | 299, 30 | 310, 31 | 318, 32 | 336, 33 | 347, 34 | 349, 35 | 354, 36 | 367, 37 | 369, 38 | 377, 39 | 394, 40 | 407, 41 | 410, 42 | 418, 43 | 420, 44 | 433, 45 | 438, 46 | 442, 47 | 452, 48 | 459, 49 | 492, 50 | 509, 51 | 515, 52 | 519, 53 | 520, 54 | 543, 55 | 551, 56 | 600, 57 | 606, 58 | 607, 59 | 610, 60 | 614, 61 | 621, 62 | 639, 63 | 663, 64 | 674, 65 | 679, 66 | 686, 67 | 702, 68 | 707, 69 | 708, 70 | 714, 71 | 724, 72 | 736, 73 | 737, 74 | 749, 75 | 775, 76 | 778, 77 | 781, 78 | 789, 79 | 796, 80 | 810, 81 | 812, 82 | 823, 83 | 826, 84 | 832, 85 | 836, 86 | 857, 87 | 872, 88 | 883, 89 | 894, 90 | 913, 91 | 937, 92 | 951, 93 | 958, 94 | 959, 95 | 974, 96 | 975, 97 | 976, 98 | 978, 99 | 996, 100 | 1008 101 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 29, 3 | 35, 4 | 56, 5 | 61, 6 | 64, 7 | 79, 8 | 81, 9 | 91, 10 | 102, 11 | 115, 12 | 116, 13 | 120, 14 | 122, 15 | 128, 16 | 147, 17 | 170, 18 | 173, 19 | 185, 20 | 187, 21 | 190, 22 | 193, 23 | 207, 24 | 211, 25 | 233, 26 | 245, 27 | 247, 28 | 252, 29 | 265, 30 | 267, 31 | 293, 32 | 295, 33 | 302, 34 | 303, 35 | 314, 36 | 322, 37 | 332, 38 | 335, 39 | 342, 40 | 346, 41 | 371, 42 | 378, 43 | 379, 44 | 385, 45 | 395, 46 | 412, 47 | 430, 48 | 443, 49 | 445, 50 | 447, 51 | 466, 52 | 467, 53 | 475, 54 | 480, 55 | 495, 56 | 507, 57 | 524, 58 | 528, 59 | 537, 60 | 553, 61 | 557, 62 | 562, 63 | 563, 64 | 564, 65 | 567, 66 | 580, 67 | 596, 68 | 624, 69 | 625, 70 | 650, 71 | 683, 72 | 710, 73 | 715, 74 | 717, 75 | 726, 76 | 739, 77 | 747, 78 | 756, 79 | 768, 80 | 787, 81 | 794, 82 | 802, 83 | 803, 84 | 817, 85 | 818, 86 | 828, 87 | 831, 88 | 839, 89 | 850, 90 | 860, 91 | 864, 92 | 877, 93 | 885, 94 | 886, 95 | 895, 96 | 922, 97 | 934, 98 | 960, 99 | 963, 100 | 965, 101 | 973, 102 | 982, 103 | 1001 104 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 6, 4 | 8, 5 | 13, 6 | 16, 7 | 28, 8 | 31, 9 | 39, 10 | 41, 11 | 51, 12 | 58, 13 | 77, 14 | 89, 15 | 125, 16 | 127, 17 | 132, 18 | 144, 19 | 213, 20 | 226, 21 | 228, 22 | 268, 23 | 275, 24 | 281, 25 | 289, 26 | 298, 27 | 305, 28 | 316, 29 | 319, 30 | 320, 31 | 321, 32 | 333, 33 | 345, 34 | 362, 35 | 382, 36 | 386, 37 | 389, 38 | 392, 39 | 397, 40 | 402, 41 | 404, 42 | 439, 43 | 441, 44 | 460, 45 | 477, 46 | 483, 47 | 498, 48 | 500, 49 | 508, 50 | 518, 51 | 523, 52 | 569, 53 | 583, 54 | 587, 55 | 589, 56 | 612, 57 | 626, 58 | 637, 59 | 666, 60 | 668, 61 | 678, 62 | 690, 63 | 694, 64 | 719, 65 | 730, 66 | 732, 67 | 758, 68 | 761, 69 | 766, 70 | 772, 71 | 788, 72 | 791, 73 | 800, 74 | 808, 75 | 809, 76 | 825, 77 | 837, 78 | 858, 79 | 862, 80 | 868, 81 | 869, 82 | 878, 83 | 889, 84 | 892, 85 | 896, 86 | 903, 87 | 904, 88 | 905, 89 | 906, 90 | 908, 91 | 911, 92 | 920, 93 | 921, 94 | 938, 95 | 939, 96 | 948, 97 | 964, 98 | 967, 99 | 986, 100 | 1007 101 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 7, 3 | 20, 4 | 33, 5 | 48, 6 | 49, 7 | 62, 8 | 68, 9 | 75, 10 | 76, 11 | 93, 12 | 98, 13 | 106, 14 | 117, 15 | 119, 16 | 126, 17 | 135, 18 | 138, 19 | 143, 20 | 195, 21 | 197, 22 | 202, 23 | 210, 24 | 216, 25 | 217, 26 | 223, 27 | 225, 28 | 239, 29 | 246, 30 | 249, 31 | 250, 32 | 264, 33 | 270, 34 | 273, 35 | 283, 36 | 292, 37 | 304, 38 | 309, 39 | 323, 40 | 341, 41 | 353, 42 | 355, 43 | 370, 44 | 380, 45 | 406, 46 | 421, 47 | 431, 48 | 448, 49 | 458, 50 | 472, 51 | 488, 52 | 499, 53 | 503, 54 | 505, 55 | 510, 56 | 536, 57 | 538, 58 | 546, 59 | 550, 60 | 556, 61 | 565, 62 | 576, 63 | 591, 64 | 592, 65 | 593, 66 | 601, 67 | 605, 68 | 608, 69 | 609, 70 | 646, 71 | 659, 72 | 664, 73 | 698, 74 | 718, 75 | 720, 76 | 727, 77 | 728, 78 | 734, 79 | 735, 80 | 741, 81 | 757, 82 | 785, 83 | 798, 84 | 805, 85 | 815, 86 | 843, 87 | 844, 88 | 874, 89 | 876, 90 | 898, 91 | 902, 92 | 942, 93 | 943, 94 | 950, 95 | 957, 96 | 972, 97 | 979, 98 | 985, 99 | 988, 100 | 990, 101 | 991, 102 | 993 103 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 15, 3 | 27, 4 | 30, 5 | 37, 6 | 43, 7 | 45, 8 | 66, 9 | 70, 10 | 105, 11 | 111, 12 | 129, 13 | 131, 14 | 142, 15 | 150, 16 | 157, 17 | 163, 18 | 165, 19 | 167, 20 | 175, 21 | 180, 22 | 186, 23 | 189, 24 | 192, 25 | 194, 26 | 218, 27 | 243, 28 | 251, 29 | 254, 30 | 277, 31 | 280, 32 | 291, 33 | 296, 34 | 306, 35 | 308, 36 | 312, 37 | 340, 38 | 359, 39 | 365, 40 | 372, 41 | 374, 42 | 375, 43 | 388, 44 | 400, 45 | 403, 46 | 413, 47 | 422, 48 | 423, 49 | 428, 50 | 450, 51 | 453, 52 | 482, 53 | 487, 54 | 497, 55 | 506, 56 | 511, 57 | 514, 58 | 527, 59 | 534, 60 | 540, 61 | 552, 62 | 558, 63 | 560, 64 | 582, 65 | 590, 66 | 597, 67 | 628, 68 | 629, 69 | 640, 70 | 644, 71 | 661, 72 | 680, 73 | 701, 74 | 703, 75 | 705, 76 | 716, 77 | 723, 78 | 731, 79 | 738, 80 | 743, 81 | 744, 82 | 745, 83 | 759, 84 | 780, 85 | 813, 86 | 820, 87 | 822, 88 | 846, 89 | 847, 90 | 852, 91 | 861, 92 | 867, 93 | 870, 94 | 880, 95 | 897, 96 | 909, 97 | 925, 98 | 926, 99 | 966, 100 | 980, 101 | 994, 102 | 998, 103 | 1000, 104 | 1004, 105 | 1006 106 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 17, 4 | 73, 5 | 99, 6 | 107, 7 | 113, 8 | 121, 9 | 139, 10 | 148, 11 | 149, 12 | 160, 13 | 161, 14 | 166, 15 | 176, 16 | 188, 17 | 214, 18 | 219, 19 | 230, 20 | 231, 21 | 237, 22 | 242, 23 | 255, 24 | 259, 25 | 266, 26 | 269, 27 | 278, 28 | 294, 29 | 300, 30 | 301, 31 | 313, 32 | 315, 33 | 317, 34 | 329, 35 | 344, 36 | 348, 37 | 350, 38 | 351, 39 | 358, 40 | 366, 41 | 387, 42 | 411, 43 | 432, 44 | 444, 45 | 470, 46 | 481, 47 | 484, 48 | 490, 49 | 512, 50 | 522, 51 | 526, 52 | 545, 53 | 548, 54 | 554, 55 | 555, 56 | 561, 57 | 571, 58 | 579, 59 | 594, 60 | 603, 61 | 611, 62 | 620, 63 | 623, 64 | 634, 65 | 654, 66 | 658, 67 | 662, 68 | 665, 69 | 667, 70 | 684, 71 | 691, 72 | 697, 73 | 709, 74 | 722, 75 | 746, 76 | 755, 77 | 777, 78 | 779, 79 | 792, 80 | 814, 81 | 838, 82 | 848, 83 | 859, 84 | 863, 85 | 865, 86 | 871, 87 | 873, 88 | 893, 89 | 912, 90 | 918, 91 | 924, 92 | 929, 93 | 932, 94 | 933, 95 | 944, 96 | 949, 97 | 952, 98 | 953, 99 | 977, 100 | 983, 101 | 984, 102 | 997, 103 | 1003 104 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 21, 4 | 24, 5 | 34, 6 | 71, 7 | 74, 8 | 78, 9 | 130, 10 | 145, 11 | 155, 12 | 156, 13 | 158, 14 | 159, 15 | 179, 16 | 222, 17 | 224, 18 | 253, 19 | 261, 20 | 285, 21 | 286, 22 | 290, 23 | 311, 24 | 324, 25 | 326, 26 | 327, 27 | 328, 28 | 330, 29 | 339, 30 | 357, 31 | 360, 32 | 363, 33 | 383, 34 | 390, 35 | 424, 36 | 425, 37 | 436, 38 | 437, 39 | 449, 40 | 463, 41 | 464, 42 | 469, 43 | 479, 44 | 489, 45 | 496, 46 | 502, 47 | 504, 48 | 513, 49 | 516, 50 | 525, 51 | 530, 52 | 559, 53 | 574, 54 | 575, 55 | 581, 56 | 586, 57 | 588, 58 | 599, 59 | 613, 60 | 617, 61 | 619, 62 | 622, 63 | 631, 64 | 636, 65 | 645, 66 | 647, 67 | 653, 68 | 656, 69 | 657, 70 | 660, 71 | 672, 72 | 692, 73 | 693, 74 | 699, 75 | 704, 76 | 760, 77 | 770, 78 | 771, 79 | 783, 80 | 793, 81 | 806, 82 | 827, 83 | 829, 84 | 845, 85 | 849, 86 | 851, 87 | 882, 88 | 887, 89 | 890, 90 | 891, 91 | 899, 92 | 900, 93 | 907, 94 | 927, 95 | 930, 96 | 946, 97 | 962, 98 | 971, 99 | 987, 100 | 992, 101 | 995, 102 | 1005 103 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 25, 4 | 26, 5 | 36, 6 | 44, 7 | 54, 8 | 59, 9 | 65, 10 | 67, 11 | 90, 12 | 92, 13 | 104, 14 | 114, 15 | 124, 16 | 133, 17 | 141, 18 | 146, 19 | 164, 20 | 169, 21 | 174, 22 | 178, 23 | 204, 24 | 209, 25 | 220, 26 | 221, 27 | 232, 28 | 234, 29 | 240, 30 | 241, 31 | 256, 32 | 258, 33 | 276, 34 | 287, 35 | 325, 36 | 331, 37 | 334, 38 | 356, 39 | 393, 40 | 398, 41 | 401, 42 | 405, 43 | 415, 44 | 426, 45 | 446, 46 | 455, 47 | 456, 48 | 465, 49 | 471, 50 | 485, 51 | 486, 52 | 493, 53 | 501, 54 | 532, 55 | 533, 56 | 542, 57 | 547, 58 | 572, 59 | 573, 60 | 595, 61 | 602, 62 | 618, 63 | 630, 64 | 638, 65 | 651, 66 | 652, 67 | 655, 68 | 670, 69 | 673, 70 | 689, 71 | 695, 72 | 696, 73 | 711, 74 | 712, 75 | 729, 76 | 742, 77 | 751, 78 | 762, 79 | 764, 80 | 765, 81 | 776, 82 | 782, 83 | 784, 84 | 786, 85 | 801, 86 | 804, 87 | 807, 88 | 819, 89 | 842, 90 | 854, 91 | 884, 92 | 888, 93 | 914, 94 | 915, 95 | 919, 96 | 928, 97 | 936, 98 | 947, 99 | 968, 100 | 970, 101 | 1002, 102 | 1009 103 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/enron/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 4, 3 | 5, 4 | 10, 5 | 14, 6 | 22, 7 | 23, 8 | 40, 9 | 47, 10 | 50, 11 | 57, 12 | 60, 13 | 69, 14 | 80, 15 | 86, 16 | 87, 17 | 95, 18 | 97, 19 | 109, 20 | 137, 21 | 140, 22 | 152, 23 | 153, 24 | 162, 25 | 171, 26 | 177, 27 | 181, 28 | 191, 29 | 212, 30 | 215, 31 | 229, 32 | 257, 33 | 272, 34 | 297, 35 | 307, 36 | 338, 37 | 368, 38 | 373, 39 | 396, 40 | 408, 41 | 414, 42 | 417, 43 | 419, 44 | 427, 45 | 429, 46 | 451, 47 | 468, 48 | 473, 49 | 517, 50 | 521, 51 | 529, 52 | 541, 53 | 549, 54 | 570, 55 | 577, 56 | 578, 57 | 585, 58 | 598, 59 | 604, 60 | 615, 61 | 616, 62 | 632, 63 | 633, 64 | 635, 65 | 648, 66 | 649, 67 | 675, 68 | 676, 69 | 677, 70 | 681, 71 | 682, 72 | 685, 73 | 688, 74 | 700, 75 | 721, 76 | 733, 77 | 740, 78 | 748, 79 | 752, 80 | 754, 81 | 767, 82 | 773, 83 | 797, 84 | 811, 85 | 824, 86 | 833, 87 | 834, 88 | 841, 89 | 853, 90 | 855, 91 | 875, 92 | 879, 93 | 901, 94 | 931, 95 | 935, 96 | 940, 97 | 954, 98 | 955, 99 | 956, 100 | 961 101 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 31, 3 | 46, 4 | 54, 5 | 55, 6 | 61, 7 | 64, 8 | 80, 9 | 84, 10 | 89, 11 | 93, 12 | 97, 13 | 112, 14 | 120, 15 | 135, 16 | 153, 17 | 155 18 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 3, 4 | 13, 5 | 17, 6 | 18, 7 | 43, 8 | 58, 9 | 66, 10 | 88, 11 | 99, 12 | 110, 13 | 114, 14 | 137, 15 | 141 16 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 7, 4 | 24, 5 | 29, 6 | 50, 7 | 59, 8 | 67, 9 | 71, 10 | 75, 11 | 78, 12 | 79, 13 | 95, 14 | 108, 15 | 117, 16 | 122, 17 | 134, 18 | 138, 19 | 147 20 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 15, 4 | 35, 5 | 47, 6 | 68, 7 | 69, 8 | 91, 9 | 109, 10 | 113, 11 | 116, 12 | 118, 13 | 119, 14 | 136, 15 | 148, 16 | 150 17 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 11, 3 | 27, 4 | 40, 5 | 49, 6 | 53, 7 | 92, 8 | 94, 9 | 105, 10 | 126, 11 | 156 12 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 12, 3 | 20, 4 | 26, 5 | 34, 6 | 62, 7 | 65, 8 | 77, 9 | 82, 10 | 98, 11 | 101, 12 | 121, 13 | 143, 14 | 152 15 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 14, 4 | 16, 5 | 28, 6 | 37, 7 | 39, 8 | 44, 9 | 45, 10 | 48, 11 | 52, 12 | 56, 13 | 63, 14 | 73, 15 | 100, 16 | 129, 17 | 140, 18 | 142, 19 | 146, 20 | 151, 21 | 154 22 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 1, 4 | 4, 5 | 10, 6 | 19, 7 | 22, 8 | 30, 9 | 38, 10 | 57, 11 | 70, 12 | 81, 13 | 83, 14 | 87, 15 | 90, 16 | 102, 17 | 103, 18 | 106, 19 | 111, 20 | 127, 21 | 130, 22 | 144 23 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 21, 3 | 23, 4 | 25, 5 | 32, 6 | 41, 7 | 42, 8 | 51, 9 | 60, 10 | 72, 11 | 76, 12 | 86, 13 | 107, 14 | 128, 15 | 131, 16 | 132, 17 | 133, 18 | 149 19 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/europarl/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 8, 3 | 33, 4 | 36, 5 | 74, 6 | 85, 7 | 96, 8 | 104, 9 | 115, 10 | 123, 11 | 124, 12 | 125, 13 | 139, 14 | 145 15 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 6, 4 | 16, 5 | 21, 6 | 25, 7 | 33, 8 | 43, 9 | 59, 10 | 62, 11 | 83, 12 | 103, 13 | 108, 14 | 109, 15 | 136, 16 | 146, 17 | 175, 18 | 186, 19 | 192, 20 | 194, 21 | 195, 22 | 203, 23 | 214, 24 | 221, 25 | 281, 26 | 283, 27 | 310, 28 | 321, 29 | 343, 30 | 365, 31 | 384, 32 | 385, 33 | 410, 34 | 412, 35 | 427, 36 | 432, 37 | 440, 38 | 451, 39 | 453, 40 | 463, 41 | 469, 42 | 476, 43 | 506, 44 | 512, 45 | 519, 46 | 522, 47 | 539, 48 | 542, 49 | 592, 50 | 594, 51 | 613, 52 | 629, 53 | 640, 54 | 647, 55 | 648, 56 | 656, 57 | 676, 58 | 700, 59 | 703, 60 | 754, 61 | 769, 62 | 787, 63 | 793, 64 | 808, 65 | 812, 66 | 817, 67 | 829, 68 | 834, 69 | 839, 70 | 843, 71 | 853, 72 | 856, 73 | 862, 74 | 867, 75 | 870, 76 | 875, 77 | 876, 78 | 877, 79 | 878, 80 | 879, 81 | 884, 82 | 886, 83 | 900, 84 | 911, 85 | 917, 86 | 939, 87 | 944, 88 | 946, 89 | 956, 90 | 969, 91 | 981, 92 | 995, 93 | 1003, 94 | 1004, 95 | 1010, 96 | 1020, 97 | 1021, 98 | 1057, 99 | 1060, 100 | 1066, 101 | 1068, 102 | 1070, 103 | 1083, 104 | 1084, 105 | 1093, 106 | 1094, 107 | 1102, 108 | 1117, 109 | 1123, 110 | 1129, 111 | 1139, 112 | 1141, 113 | 1151, 114 | 1167, 115 | 1176, 116 | 1188, 117 | 1190, 118 | 1197, 119 | 1214, 120 | 1219, 121 | 1231, 122 | 1236, 123 | 1251, 124 | 1261, 125 | 1267, 126 | 1274, 127 | 1293, 128 | 1294, 129 | 1300, 130 | 1302, 131 | 1306, 132 | 1307, 133 | 1308, 134 | 1309, 135 | 1314, 136 | 1327, 137 | 1337, 138 | 1346, 139 | 1355, 140 | 1364, 141 | 1374, 142 | 1382, 143 | 1384, 144 | 1390, 145 | 1396, 146 | 1400, 147 | 1403, 148 | 1422, 149 | 1437, 150 | 1447, 151 | 1453, 152 | 1459, 153 | 1466, 154 | 1499, 155 | 1515, 156 | 1523, 157 | 1528, 158 | 1553, 159 | 1556, 160 | 1567, 161 | 1603, 162 | 1606, 163 | 1607, 164 | 1620, 165 | 1629, 166 | 1660, 167 | 1701, 168 | 1728, 169 | 1735, 170 | 1743, 171 | 1765, 172 | 1775, 173 | 1778, 174 | 1779, 175 | 1816, 176 | 1834, 177 | 1839, 178 | 1852, 179 | 1868, 180 | 1878, 181 | 1884, 182 | 1890, 183 | 1910, 184 | 1917, 185 | 1939, 186 | 1945, 187 | 1946, 188 | 1950, 189 | 1991, 190 | 1992, 191 | 2006, 192 | 2038, 193 | 2045, 194 | 2060, 195 | 2076, 196 | 2079, 197 | 2089, 198 | 2092, 199 | 2096, 200 | 2099, 201 | 2121, 202 | 2133, 203 | 2135, 204 | 2138, 205 | 2143, 206 | 2157, 207 | 2163, 208 | 2164, 209 | 2167, 210 | 2183, 211 | 2190, 212 | 2195, 213 | 2197, 214 | 2206, 215 | 2223, 216 | 2236, 217 | 2249, 218 | 2261, 219 | 2263, 220 | 2272, 221 | 2276, 222 | 2279, 223 | 2297, 224 | 2310, 225 | 2325, 226 | 2330, 227 | 2344, 228 | 2372, 229 | 2376, 230 | 2378, 231 | 2385, 232 | 2394, 233 | 2395, 234 | 2405, 235 | 2406, 236 | 2410, 237 | 2416, 238 | 2426, 239 | 2435, 240 | 2443, 241 | 2446, 242 | 2447, 243 | 2448, 244 | 2468, 245 | 2503, 246 | 2510, 247 | 2511, 248 | 2519, 249 | 2560, 250 | 2562, 251 | 2567, 252 | 2575, 253 | 2586, 254 | 2591, 255 | 2611, 256 | 2612, 257 | 2616, 258 | 2629, 259 | 2632, 260 | 2637, 261 | 2644, 262 | 2647, 263 | 2652, 264 | 2672, 265 | 2675, 266 | 2684, 267 | 2691, 268 | 2694, 269 | 2706, 270 | 2715, 271 | 2721, 272 | 2755, 273 | 2764, 274 | 2771, 275 | 2780, 276 | 2789, 277 | 2792, 278 | 2808, 279 | 2812, 280 | 2816, 281 | 2825, 282 | 2831, 283 | 2837, 284 | 2841, 285 | 2847, 286 | 2849, 287 | 2861, 288 | 2863, 289 | 2917, 290 | 2930, 291 | 2948, 292 | 2958, 293 | 2964, 294 | 2967, 295 | 2997, 296 | 3001, 297 | 3005, 298 | 3008, 299 | 3022, 300 | 3024, 301 | 3028, 302 | 3046, 303 | 3051, 304 | 3055, 305 | 3059, 306 | 3068, 307 | 3085, 308 | 3088, 309 | 3089, 310 | 3092, 311 | 3095, 312 | 3112, 313 | 3117, 314 | 3133, 315 | 3152, 316 | 3157, 317 | 3164, 318 | 3194, 319 | 3199, 320 | 3207, 321 | 3218, 322 | 3224, 323 | 3228, 324 | 3229, 325 | 3236, 326 | 3251, 327 | 3263, 328 | 3268, 329 | 3277, 330 | 3278, 331 | 3283, 332 | 3297, 333 | 3305, 334 | 3307, 335 | 3308, 336 | 3317, 337 | 3343, 338 | 3353, 339 | 3382, 340 | 3384, 341 | 3385, 342 | 3392, 343 | 3396, 344 | 3410, 345 | 3417, 346 | 3430, 347 | 3431, 348 | 3456, 349 | 3470, 350 | 3500, 351 | 3504, 352 | 3516, 353 | 3525, 354 | 3530, 355 | 3544, 356 | 3554, 357 | 3565, 358 | 3572, 359 | 3579, 360 | 3586, 361 | 3607, 362 | 3618, 363 | 3619, 364 | 3622, 365 | 3631, 366 | 3644, 367 | 3648, 368 | 3659, 369 | 3666, 370 | 3669, 371 | 3683, 372 | 3689, 373 | 3699, 374 | 3701, 375 | 3726, 376 | 3733, 377 | 3738, 378 | 3747, 379 | 3750, 380 | 3768, 381 | 3770, 382 | 3781, 383 | 3790, 384 | 3815, 385 | 3821, 386 | 3841, 387 | 3847, 388 | 3870, 389 | 3908, 390 | 3910, 391 | 3917, 392 | 3928, 393 | 3950, 394 | 3955, 395 | 3982, 396 | 4012, 397 | 4035, 398 | 4036, 399 | 4041, 400 | 4044, 401 | 4045, 402 | 4063, 403 | 4064, 404 | 4072, 405 | 4088, 406 | 4108, 407 | 4109, 408 | 4119, 409 | 4139, 410 | 4141, 411 | 4160, 412 | 4170, 413 | 4174, 414 | 4185, 415 | 4204, 416 | 4212, 417 | 4216, 418 | 4233, 419 | 4245, 420 | 4249, 421 | 4264, 422 | 4282, 423 | 4293, 424 | 4306, 425 | 4314, 426 | 4316, 427 | 4320, 428 | 4321, 429 | 4342, 430 | 4343, 431 | 4347, 432 | 4384, 433 | 4387, 434 | 4390, 435 | 4401, 436 | 4453, 437 | 4458, 438 | 4467, 439 | 4472, 440 | 4474, 441 | 4482, 442 | 4488, 443 | 4527, 444 | 4530, 445 | 4531, 446 | 4539, 447 | 4544, 448 | 4560, 449 | 4587, 450 | 4595, 451 | 4601, 452 | 4613, 453 | 4618, 454 | 4620, 455 | 4641, 456 | 4659, 457 | 4661, 458 | 4667, 459 | 4668, 460 | 4681, 461 | 4686, 462 | 4692, 463 | 4695, 464 | 4706, 465 | 4716, 466 | 4719, 467 | 4721, 468 | 4725, 469 | 4731, 470 | 4737, 471 | 4746, 472 | 4751, 473 | 4758, 474 | 4775, 475 | 4778, 476 | 4782, 477 | 4798, 478 | 4817, 479 | 4823, 480 | 4839, 481 | 4851, 482 | 4868, 483 | 4869, 484 | 4931, 485 | 4939, 486 | 4940, 487 | 4950, 488 | 4971, 489 | 4977, 490 | 4993, 491 | 4996, 492 | 5011, 493 | 5020, 494 | 5024, 495 | 5038, 496 | 5042, 497 | 5096 498 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 7, 3 | 23, 4 | 34, 5 | 63, 6 | 71, 7 | 86, 8 | 92, 9 | 93, 10 | 94, 11 | 104, 12 | 114, 13 | 115, 14 | 117, 15 | 128, 16 | 135, 17 | 150, 18 | 158, 19 | 159, 20 | 165, 21 | 166, 22 | 199, 23 | 205, 24 | 217, 25 | 233, 26 | 242, 27 | 257, 28 | 260, 29 | 269, 30 | 279, 31 | 290, 32 | 316, 33 | 330, 34 | 340, 35 | 344, 36 | 349, 37 | 352, 38 | 355, 39 | 359, 40 | 371, 41 | 387, 42 | 402, 43 | 417, 44 | 446, 45 | 448, 46 | 454, 47 | 458, 48 | 465, 49 | 468, 50 | 473, 51 | 478, 52 | 487, 53 | 492, 54 | 531, 55 | 561, 56 | 566, 57 | 586, 58 | 589, 59 | 590, 60 | 591, 61 | 598, 62 | 603, 63 | 612, 64 | 620, 65 | 635, 66 | 662, 67 | 674, 68 | 679, 69 | 680, 70 | 683, 71 | 684, 72 | 688, 73 | 714, 74 | 726, 75 | 730, 76 | 732, 77 | 749, 78 | 755, 79 | 763, 80 | 764, 81 | 772, 82 | 781, 83 | 792, 84 | 803, 85 | 804, 86 | 814, 87 | 850, 88 | 859, 89 | 863, 90 | 866, 91 | 887, 92 | 904, 93 | 910, 94 | 916, 95 | 922, 96 | 961, 97 | 968, 98 | 971, 99 | 973, 100 | 975, 101 | 978, 102 | 985, 103 | 987, 104 | 996, 105 | 1030, 106 | 1034, 107 | 1042, 108 | 1045, 109 | 1050, 110 | 1071, 111 | 1075, 112 | 1086, 113 | 1143, 114 | 1154, 115 | 1159, 116 | 1173, 117 | 1175, 118 | 1192, 119 | 1193, 120 | 1202, 121 | 1203, 122 | 1225, 123 | 1230, 124 | 1233, 125 | 1234, 126 | 1240, 127 | 1244, 128 | 1250, 129 | 1270, 130 | 1273, 131 | 1279, 132 | 1292, 133 | 1319, 134 | 1329, 135 | 1332, 136 | 1343, 137 | 1347, 138 | 1360, 139 | 1397, 140 | 1408, 141 | 1410, 142 | 1415, 143 | 1417, 144 | 1420, 145 | 1423, 146 | 1431, 147 | 1446, 148 | 1454, 149 | 1471, 150 | 1473, 151 | 1476, 152 | 1496, 153 | 1498, 154 | 1514, 155 | 1532, 156 | 1540, 157 | 1542, 158 | 1552, 159 | 1562, 160 | 1571, 161 | 1584, 162 | 1587, 163 | 1589, 164 | 1609, 165 | 1623, 166 | 1630, 167 | 1631, 168 | 1641, 169 | 1642, 170 | 1643, 171 | 1645, 172 | 1647, 173 | 1653, 174 | 1663, 175 | 1699, 176 | 1724, 177 | 1730, 178 | 1736, 179 | 1766, 180 | 1767, 181 | 1768, 182 | 1771, 183 | 1780, 184 | 1793, 185 | 1798, 186 | 1803, 187 | 1811, 188 | 1813, 189 | 1825, 190 | 1830, 191 | 1837, 192 | 1845, 193 | 1855, 194 | 1859, 195 | 1861, 196 | 1872, 197 | 1873, 198 | 1874, 199 | 1877, 200 | 1902, 201 | 1903, 202 | 1905, 203 | 1906, 204 | 1908, 205 | 1914, 206 | 1919, 207 | 1938, 208 | 1953, 209 | 1959, 210 | 1963, 211 | 1975, 212 | 1982, 213 | 1983, 214 | 1989, 215 | 2007, 216 | 2013, 217 | 2014, 218 | 2016, 219 | 2031, 220 | 2032, 221 | 2039, 222 | 2044, 223 | 2063, 224 | 2067, 225 | 2074, 226 | 2085, 227 | 2086, 228 | 2087, 229 | 2098, 230 | 2105, 231 | 2106, 232 | 2120, 233 | 2150, 234 | 2165, 235 | 2174, 236 | 2175, 237 | 2184, 238 | 2222, 239 | 2258, 240 | 2268, 241 | 2269, 242 | 2271, 243 | 2294, 244 | 2298, 245 | 2308, 246 | 2318, 247 | 2336, 248 | 2342, 249 | 2346, 250 | 2353, 251 | 2371, 252 | 2379, 253 | 2387, 254 | 2392, 255 | 2393, 256 | 2407, 257 | 2414, 258 | 2423, 259 | 2463, 260 | 2486, 261 | 2496, 262 | 2500, 263 | 2508, 264 | 2517, 265 | 2549, 266 | 2550, 267 | 2552, 268 | 2557, 269 | 2563, 270 | 2571, 271 | 2582, 272 | 2593, 273 | 2617, 274 | 2621, 275 | 2625, 276 | 2631, 277 | 2636, 278 | 2639, 279 | 2640, 280 | 2649, 281 | 2650, 282 | 2663, 283 | 2670, 284 | 2701, 285 | 2702, 286 | 2722, 287 | 2739, 288 | 2759, 289 | 2787, 290 | 2791, 291 | 2824, 292 | 2828, 293 | 2862, 294 | 2866, 295 | 2885, 296 | 2897, 297 | 2901, 298 | 2908, 299 | 2927, 300 | 2946, 301 | 2992, 302 | 2996, 303 | 3016, 304 | 3027, 305 | 3041, 306 | 3047, 307 | 3050, 308 | 3053, 309 | 3056, 310 | 3057, 311 | 3066, 312 | 3081, 313 | 3099, 314 | 3100, 315 | 3101, 316 | 3102, 317 | 3106, 318 | 3114, 319 | 3138, 320 | 3147, 321 | 3158, 322 | 3166, 323 | 3169, 324 | 3173, 325 | 3176, 326 | 3193, 327 | 3202, 328 | 3211, 329 | 3242, 330 | 3253, 331 | 3256, 332 | 3264, 333 | 3271, 334 | 3282, 335 | 3295, 336 | 3299, 337 | 3309, 338 | 3311, 339 | 3322, 340 | 3329, 341 | 3358, 342 | 3361, 343 | 3409, 344 | 3411, 345 | 3424, 346 | 3428, 347 | 3446, 348 | 3450, 349 | 3455, 350 | 3457, 351 | 3461, 352 | 3472, 353 | 3481, 354 | 3482, 355 | 3486, 356 | 3509, 357 | 3511, 358 | 3518, 359 | 3523, 360 | 3524, 361 | 3529, 362 | 3531, 363 | 3543, 364 | 3555, 365 | 3570, 366 | 3571, 367 | 3574, 368 | 3575, 369 | 3583, 370 | 3587, 371 | 3613, 372 | 3617, 373 | 3627, 374 | 3667, 375 | 3670, 376 | 3677, 377 | 3694, 378 | 3695, 379 | 3696, 380 | 3712, 381 | 3731, 382 | 3742, 383 | 3746, 384 | 3756, 385 | 3778, 386 | 3782, 387 | 3783, 388 | 3793, 389 | 3794, 390 | 3806, 391 | 3812, 392 | 3830, 393 | 3837, 394 | 3848, 395 | 3852, 396 | 3853, 397 | 3854, 398 | 3856, 399 | 3861, 400 | 3879, 401 | 3883, 402 | 3895, 403 | 3904, 404 | 3907, 405 | 3909, 406 | 3920, 407 | 3922, 408 | 3925, 409 | 3933, 410 | 3935, 411 | 3937, 412 | 3952, 413 | 3957, 414 | 3985, 415 | 3986, 416 | 3990, 417 | 3996, 418 | 4023, 419 | 4026, 420 | 4030, 421 | 4033, 422 | 4040, 423 | 4043, 424 | 4050, 425 | 4057, 426 | 4071, 427 | 4099, 428 | 4104, 429 | 4116, 430 | 4126, 431 | 4128, 432 | 4132, 433 | 4133, 434 | 4137, 435 | 4140, 436 | 4146, 437 | 4150, 438 | 4162, 439 | 4177, 440 | 4182, 441 | 4200, 442 | 4210, 443 | 4224, 444 | 4244, 445 | 4248, 446 | 4250, 447 | 4253, 448 | 4259, 449 | 4260, 450 | 4263, 451 | 4265, 452 | 4266, 453 | 4279, 454 | 4281, 455 | 4301, 456 | 4303, 457 | 4322, 458 | 4323, 459 | 4329, 460 | 4336, 461 | 4339, 462 | 4369, 463 | 4380, 464 | 4411, 465 | 4413, 466 | 4419, 467 | 4432, 468 | 4433, 469 | 4439, 470 | 4442, 471 | 4443, 472 | 4455, 473 | 4468, 474 | 4496, 475 | 4502, 476 | 4510, 477 | 4513, 478 | 4515, 479 | 4517, 480 | 4540, 481 | 4551, 482 | 4562, 483 | 4569, 484 | 4571, 485 | 4579, 486 | 4580, 487 | 4581, 488 | 4583, 489 | 4604, 490 | 4627, 491 | 4637, 492 | 4655, 493 | 4660, 494 | 4669, 495 | 4676, 496 | 4687, 497 | 4688, 498 | 4703, 499 | 4704, 500 | 4748, 501 | 4819, 502 | 4820, 503 | 4871, 504 | 4873, 505 | 4875, 506 | 4883, 507 | 4889, 508 | 4907, 509 | 4911, 510 | 4913, 511 | 4915, 512 | 4916, 513 | 4922, 514 | 4925, 515 | 4932, 516 | 4945, 517 | 4978, 518 | 4992, 519 | 4995, 520 | 4999, 521 | 5009, 522 | 5051, 523 | 5056, 524 | 5061, 525 | 5062, 526 | 5072, 527 | 5073, 528 | 5079, 529 | 5084, 530 | 5086, 531 | 5087 532 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 8, 4 | 22, 5 | 38, 6 | 51, 7 | 66, 8 | 77, 9 | 88, 10 | 119, 11 | 124, 12 | 162, 13 | 172, 14 | 177, 15 | 181, 16 | 183, 17 | 196, 18 | 198, 19 | 210, 20 | 212, 21 | 227, 22 | 235, 23 | 237, 24 | 240, 25 | 275, 26 | 296, 27 | 313, 28 | 314, 29 | 320, 30 | 332, 31 | 337, 32 | 351, 33 | 353, 34 | 367, 35 | 368, 36 | 372, 37 | 380, 38 | 381, 39 | 388, 40 | 391, 41 | 392, 42 | 397, 43 | 409, 44 | 424, 45 | 425, 46 | 435, 47 | 438, 48 | 443, 49 | 449, 50 | 450, 51 | 455, 52 | 466, 53 | 474, 54 | 480, 55 | 516, 56 | 517, 57 | 528, 58 | 536, 59 | 538, 60 | 540, 61 | 549, 62 | 553, 63 | 575, 64 | 582, 65 | 605, 66 | 609, 67 | 634, 68 | 643, 69 | 644, 70 | 660, 71 | 671, 72 | 701, 73 | 702, 74 | 704, 75 | 707, 76 | 715, 77 | 716, 78 | 719, 79 | 742, 80 | 774, 81 | 775, 82 | 786, 83 | 799, 84 | 818, 85 | 822, 86 | 828, 87 | 831, 88 | 840, 89 | 844, 90 | 885, 91 | 897, 92 | 905, 93 | 927, 94 | 936, 95 | 977, 96 | 989, 97 | 1000, 98 | 1007, 99 | 1011, 100 | 1012, 101 | 1077, 102 | 1095, 103 | 1100, 104 | 1101, 105 | 1105, 106 | 1116, 107 | 1124, 108 | 1127, 109 | 1140, 110 | 1150, 111 | 1160, 112 | 1171, 113 | 1177, 114 | 1215, 115 | 1228, 116 | 1237, 117 | 1239, 118 | 1241, 119 | 1242, 120 | 1246, 121 | 1249, 122 | 1254, 123 | 1280, 124 | 1281, 125 | 1287, 126 | 1322, 127 | 1328, 128 | 1370, 129 | 1376, 130 | 1380, 131 | 1393, 132 | 1425, 133 | 1426, 134 | 1428, 135 | 1429, 136 | 1440, 137 | 1441, 138 | 1448, 139 | 1465, 140 | 1474, 141 | 1479, 142 | 1485, 143 | 1487, 144 | 1492, 145 | 1501, 146 | 1508, 147 | 1512, 148 | 1549, 149 | 1554, 150 | 1583, 151 | 1594, 152 | 1598, 153 | 1600, 154 | 1602, 155 | 1608, 156 | 1617, 157 | 1622, 158 | 1632, 159 | 1644, 160 | 1652, 161 | 1670, 162 | 1675, 163 | 1678, 164 | 1679, 165 | 1687, 166 | 1702, 167 | 1706, 168 | 1710, 169 | 1737, 170 | 1741, 171 | 1744, 172 | 1749, 173 | 1762, 174 | 1772, 175 | 1789, 176 | 1795, 177 | 1800, 178 | 1810, 179 | 1819, 180 | 1827, 181 | 1831, 182 | 1842, 183 | 1862, 184 | 1879, 185 | 1888, 186 | 1920, 187 | 1924, 188 | 1936, 189 | 1944, 190 | 1951, 191 | 1954, 192 | 1961, 193 | 1966, 194 | 1972, 195 | 1977, 196 | 1987, 197 | 1994, 198 | 1996, 199 | 1997, 200 | 2029, 201 | 2030, 202 | 2035, 203 | 2042, 204 | 2075, 205 | 2082, 206 | 2091, 207 | 2093, 208 | 2107, 209 | 2129, 210 | 2142, 211 | 2171, 212 | 2172, 213 | 2179, 214 | 2182, 215 | 2194, 216 | 2201, 217 | 2208, 218 | 2209, 219 | 2219, 220 | 2227, 221 | 2230, 222 | 2248, 223 | 2255, 224 | 2287, 225 | 2304, 226 | 2316, 227 | 2320, 228 | 2335, 229 | 2349, 230 | 2357, 231 | 2358, 232 | 2397, 233 | 2402, 234 | 2403, 235 | 2418, 236 | 2434, 237 | 2436, 238 | 2449, 239 | 2456, 240 | 2467, 241 | 2476, 242 | 2481, 243 | 2487, 244 | 2498, 245 | 2499, 246 | 2522, 247 | 2539, 248 | 2579, 249 | 2580, 250 | 2598, 251 | 2607, 252 | 2638, 253 | 2645, 254 | 2676, 255 | 2682, 256 | 2688, 257 | 2692, 258 | 2698, 259 | 2704, 260 | 2705, 261 | 2716, 262 | 2720, 263 | 2732, 264 | 2748, 265 | 2756, 266 | 2767, 267 | 2795, 268 | 2801, 269 | 2813, 270 | 2817, 271 | 2821, 272 | 2864, 273 | 2870, 274 | 2876, 275 | 2877, 276 | 2882, 277 | 2889, 278 | 2913, 279 | 2938, 280 | 2939, 281 | 2951, 282 | 2959, 283 | 2961, 284 | 2969, 285 | 2975, 286 | 2976, 287 | 3014, 288 | 3023, 289 | 3033, 290 | 3035, 291 | 3042, 292 | 3064, 293 | 3065, 294 | 3073, 295 | 3105, 296 | 3111, 297 | 3118, 298 | 3119, 299 | 3125, 300 | 3136, 301 | 3162, 302 | 3167, 303 | 3172, 304 | 3179, 305 | 3182, 306 | 3190, 307 | 3203, 308 | 3219, 309 | 3231, 310 | 3234, 311 | 3246, 312 | 3249, 313 | 3257, 314 | 3261, 315 | 3284, 316 | 3288, 317 | 3306, 318 | 3314, 319 | 3340, 320 | 3349, 321 | 3357, 322 | 3359, 323 | 3367, 324 | 3368, 325 | 3375, 326 | 3414, 327 | 3418, 328 | 3423, 329 | 3427, 330 | 3432, 331 | 3440, 332 | 3449, 333 | 3458, 334 | 3467, 335 | 3474, 336 | 3476, 337 | 3478, 338 | 3493, 339 | 3497, 340 | 3498, 341 | 3521, 342 | 3528, 343 | 3547, 344 | 3548, 345 | 3568, 346 | 3582, 347 | 3585, 348 | 3594, 349 | 3599, 350 | 3643, 351 | 3663, 352 | 3681, 353 | 3690, 354 | 3691, 355 | 3698, 356 | 3710, 357 | 3717, 358 | 3720, 359 | 3729, 360 | 3732, 361 | 3734, 362 | 3740, 363 | 3745, 364 | 3760, 365 | 3762, 366 | 3763, 367 | 3771, 368 | 3773, 369 | 3786, 370 | 3789, 371 | 3792, 372 | 3809, 373 | 3813, 374 | 3824, 375 | 3827, 376 | 3846, 377 | 3855, 378 | 3864, 379 | 3871, 380 | 3893, 381 | 3897, 382 | 3912, 383 | 3938, 384 | 3942, 385 | 3947, 386 | 3954, 387 | 3964, 388 | 3974, 389 | 3979, 390 | 3991, 391 | 3993, 392 | 3998, 393 | 4011, 394 | 4016, 395 | 4034, 396 | 4039, 397 | 4058, 398 | 4069, 399 | 4073, 400 | 4074, 401 | 4095, 402 | 4107, 403 | 4113, 404 | 4117, 405 | 4124, 406 | 4129, 407 | 4130, 408 | 4135, 409 | 4143, 410 | 4151, 411 | 4165, 412 | 4171, 413 | 4175, 414 | 4176, 415 | 4188, 416 | 4199, 417 | 4206, 418 | 4220, 419 | 4225, 420 | 4237, 421 | 4241, 422 | 4269, 423 | 4280, 424 | 4287, 425 | 4294, 426 | 4296, 427 | 4297, 428 | 4310, 429 | 4311, 430 | 4312, 431 | 4361, 432 | 4376, 433 | 4386, 434 | 4388, 435 | 4392, 436 | 4400, 437 | 4406, 438 | 4422, 439 | 4426, 440 | 4428, 441 | 4437, 442 | 4449, 443 | 4450, 444 | 4460, 445 | 4461, 446 | 4466, 447 | 4475, 448 | 4499, 449 | 4505, 450 | 4507, 451 | 4509, 452 | 4518, 453 | 4529, 454 | 4533, 455 | 4538, 456 | 4548, 457 | 4552, 458 | 4564, 459 | 4588, 460 | 4593, 461 | 4594, 462 | 4605, 463 | 4611, 464 | 4628, 465 | 4679, 466 | 4680, 467 | 4693, 468 | 4697, 469 | 4730, 470 | 4733, 471 | 4734, 472 | 4735, 473 | 4766, 474 | 4769, 475 | 4777, 476 | 4849, 477 | 4865, 478 | 4878, 479 | 4879, 480 | 4894, 481 | 4895, 482 | 4896, 483 | 4906, 484 | 4926, 485 | 4955, 486 | 4958, 487 | 4964, 488 | 4969, 489 | 4985, 490 | 4989, 491 | 4990, 492 | 4994, 493 | 4997, 494 | 5005, 495 | 5016, 496 | 5029, 497 | 5031, 498 | 5049, 499 | 5058, 500 | 5082, 501 | 5100 502 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 11, 3 | 29, 4 | 35, 5 | 46, 6 | 85, 7 | 99, 8 | 110, 9 | 111, 10 | 118, 11 | 131, 12 | 144, 13 | 145, 14 | 154, 15 | 161, 16 | 164, 17 | 173, 18 | 176, 19 | 197, 20 | 200, 21 | 206, 22 | 213, 23 | 226, 24 | 228, 25 | 231, 26 | 234, 27 | 239, 28 | 247, 29 | 250, 30 | 254, 31 | 271, 32 | 274, 33 | 282, 34 | 292, 35 | 295, 36 | 297, 37 | 301, 38 | 303, 39 | 305, 40 | 309, 41 | 318, 42 | 323, 43 | 333, 44 | 341, 45 | 348, 46 | 350, 47 | 354, 48 | 358, 49 | 364, 50 | 383, 51 | 396, 52 | 398, 53 | 411, 54 | 413, 55 | 429, 56 | 467, 57 | 472, 58 | 481, 59 | 485, 60 | 488, 61 | 520, 62 | 523, 63 | 530, 64 | 547, 65 | 552, 66 | 574, 67 | 576, 68 | 580, 69 | 587, 70 | 614, 71 | 655, 72 | 657, 73 | 666, 74 | 672, 75 | 681, 76 | 682, 77 | 689, 78 | 690, 79 | 695, 80 | 698, 81 | 705, 82 | 709, 83 | 721, 84 | 722, 85 | 724, 86 | 745, 87 | 750, 88 | 784, 89 | 788, 90 | 789, 91 | 800, 92 | 809, 93 | 823, 94 | 848, 95 | 880, 96 | 881, 97 | 893, 98 | 901, 99 | 907, 100 | 924, 101 | 928, 102 | 929, 103 | 931, 104 | 938, 105 | 943, 106 | 950, 107 | 955, 108 | 964, 109 | 967, 110 | 988, 111 | 993, 112 | 1002, 113 | 1006, 114 | 1019, 115 | 1023, 116 | 1024, 117 | 1043, 118 | 1053, 119 | 1056, 120 | 1085, 121 | 1114, 122 | 1115, 123 | 1120, 124 | 1122, 125 | 1130, 126 | 1134, 127 | 1148, 128 | 1191, 129 | 1221, 130 | 1253, 131 | 1257, 132 | 1259, 133 | 1265, 134 | 1271, 135 | 1286, 136 | 1290, 137 | 1296, 138 | 1297, 139 | 1303, 140 | 1310, 141 | 1340, 142 | 1359, 143 | 1369, 144 | 1379, 145 | 1383, 146 | 1401, 147 | 1406, 148 | 1418, 149 | 1427, 150 | 1432, 151 | 1483, 152 | 1491, 153 | 1494, 154 | 1505, 155 | 1506, 156 | 1524, 157 | 1535, 158 | 1577, 159 | 1590, 160 | 1604, 161 | 1616, 162 | 1624, 163 | 1638, 164 | 1639, 165 | 1655, 166 | 1662, 167 | 1676, 168 | 1682, 169 | 1686, 170 | 1691, 171 | 1704, 172 | 1712, 173 | 1748, 174 | 1750, 175 | 1753, 176 | 1760, 177 | 1763, 178 | 1783, 179 | 1792, 180 | 1799, 181 | 1801, 182 | 1808, 183 | 1833, 184 | 1841, 185 | 1844, 186 | 1870, 187 | 1876, 188 | 1892, 189 | 1935, 190 | 1943, 191 | 1969, 192 | 2003, 193 | 2025, 194 | 2040, 195 | 2056, 196 | 2069, 197 | 2071, 198 | 2083, 199 | 2103, 200 | 2116, 201 | 2123, 202 | 2124, 203 | 2144, 204 | 2146, 205 | 2168, 206 | 2180, 207 | 2187, 208 | 2202, 209 | 2205, 210 | 2211, 211 | 2220, 212 | 2237, 213 | 2241, 214 | 2246, 215 | 2247, 216 | 2253, 217 | 2275, 218 | 2277, 219 | 2295, 220 | 2306, 221 | 2313, 222 | 2322, 223 | 2324, 224 | 2332, 225 | 2352, 226 | 2364, 227 | 2391, 228 | 2411, 229 | 2458, 230 | 2462, 231 | 2483, 232 | 2484, 233 | 2491, 234 | 2501, 235 | 2509, 236 | 2513, 237 | 2521, 238 | 2529, 239 | 2536, 240 | 2558, 241 | 2568, 242 | 2576, 243 | 2584, 244 | 2588, 245 | 2589, 246 | 2592, 247 | 2596, 248 | 2601, 249 | 2608, 250 | 2624, 251 | 2634, 252 | 2651, 253 | 2657, 254 | 2658, 255 | 2661, 256 | 2662, 257 | 2668, 258 | 2679, 259 | 2683, 260 | 2696, 261 | 2709, 262 | 2711, 263 | 2717, 264 | 2725, 265 | 2730, 266 | 2744, 267 | 2746, 268 | 2757, 269 | 2769, 270 | 2770, 271 | 2814, 272 | 2819, 273 | 2820, 274 | 2826, 275 | 2829, 276 | 2834, 277 | 2853, 278 | 2867, 279 | 2893, 280 | 2900, 281 | 2905, 282 | 2916, 283 | 2920, 284 | 2924, 285 | 2935, 286 | 2965, 287 | 2971, 288 | 2983, 289 | 3006, 290 | 3007, 291 | 3013, 292 | 3020, 293 | 3025, 294 | 3029, 295 | 3038, 296 | 3054, 297 | 3060, 298 | 3061, 299 | 3063, 300 | 3070, 301 | 3071, 302 | 3075, 303 | 3079, 304 | 3082, 305 | 3090, 306 | 3096, 307 | 3135, 308 | 3143, 309 | 3153, 310 | 3161, 311 | 3168, 312 | 3170, 313 | 3181, 314 | 3187, 315 | 3195, 316 | 3204, 317 | 3209, 318 | 3210, 319 | 3225, 320 | 3239, 321 | 3254, 322 | 3260, 323 | 3265, 324 | 3273, 325 | 3286, 326 | 3315, 327 | 3321, 328 | 3332, 329 | 3337, 330 | 3363, 331 | 3364, 332 | 3377, 333 | 3378, 334 | 3380, 335 | 3398, 336 | 3401, 337 | 3402, 338 | 3421, 339 | 3436, 340 | 3445, 341 | 3463, 342 | 3465, 343 | 3508, 344 | 3512, 345 | 3513, 346 | 3515, 347 | 3519, 348 | 3534, 349 | 3562, 350 | 3581, 351 | 3584, 352 | 3588, 353 | 3591, 354 | 3600, 355 | 3611, 356 | 3650, 357 | 3652, 358 | 3658, 359 | 3687, 360 | 3700, 361 | 3716, 362 | 3730, 363 | 3737, 364 | 3772, 365 | 3784, 366 | 3802, 367 | 3805, 368 | 3807, 369 | 3808, 370 | 3825, 371 | 3839, 372 | 3863, 373 | 3867, 374 | 3873, 375 | 3881, 376 | 3885, 377 | 3886, 378 | 3888, 379 | 3890, 380 | 3892, 381 | 3894, 382 | 3896, 383 | 3916, 384 | 3962, 385 | 3963, 386 | 3965, 387 | 3969, 388 | 3983, 389 | 3995, 390 | 3997, 391 | 4010, 392 | 4013, 393 | 4014, 394 | 4021, 395 | 4025, 396 | 4032, 397 | 4042, 398 | 4048, 399 | 4053, 400 | 4055, 401 | 4065, 402 | 4078, 403 | 4091, 404 | 4093, 405 | 4111, 406 | 4122, 407 | 4134, 408 | 4142, 409 | 4152, 410 | 4154, 411 | 4181, 412 | 4197, 413 | 4229, 414 | 4230, 415 | 4231, 416 | 4251, 417 | 4252, 418 | 4262, 419 | 4284, 420 | 4285, 421 | 4289, 422 | 4325, 423 | 4331, 424 | 4335, 425 | 4348, 426 | 4366, 427 | 4372, 428 | 4425, 429 | 4427, 430 | 4435, 431 | 4446, 432 | 4457, 433 | 4477, 434 | 4481, 435 | 4493, 436 | 4494, 437 | 4521, 438 | 4523, 439 | 4543, 440 | 4559, 441 | 4575, 442 | 4600, 443 | 4614, 444 | 4629, 445 | 4634, 446 | 4650, 447 | 4651, 448 | 4653, 449 | 4654, 450 | 4675, 451 | 4690, 452 | 4691, 453 | 4696, 454 | 4711, 455 | 4713, 456 | 4715, 457 | 4723, 458 | 4729, 459 | 4745, 460 | 4752, 461 | 4761, 462 | 4767, 463 | 4785, 464 | 4788, 465 | 4799, 466 | 4808, 467 | 4809, 468 | 4812, 469 | 4815, 470 | 4832, 471 | 4834, 472 | 4861, 473 | 4867, 474 | 4900, 475 | 4909, 476 | 4919, 477 | 4923, 478 | 4928, 479 | 4933, 480 | 4935, 481 | 4936, 482 | 4947, 483 | 4948, 484 | 4949, 485 | 4963, 486 | 4966, 487 | 4967, 488 | 4968, 489 | 4973, 490 | 4986, 491 | 4988, 492 | 5000, 493 | 5017, 494 | 5019, 495 | 5027, 496 | 5030, 497 | 5035, 498 | 5037, 499 | 5039 500 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 10, 3 | 26, 4 | 36, 5 | 37, 6 | 54, 7 | 55, 8 | 58, 9 | 61, 10 | 76, 11 | 80, 12 | 81, 13 | 87, 14 | 96, 15 | 102, 16 | 106, 17 | 132, 18 | 139, 19 | 140, 20 | 143, 21 | 148, 22 | 156, 23 | 179, 24 | 190, 25 | 191, 26 | 201, 27 | 207, 28 | 225, 29 | 243, 30 | 258, 31 | 261, 32 | 262, 33 | 273, 34 | 285, 35 | 286, 36 | 287, 37 | 319, 38 | 334, 39 | 357, 40 | 404, 41 | 415, 42 | 441, 43 | 445, 44 | 460, 45 | 483, 46 | 496, 47 | 501, 48 | 509, 49 | 524, 50 | 532, 51 | 533, 52 | 535, 53 | 548, 54 | 554, 55 | 563, 56 | 568, 57 | 572, 58 | 584, 59 | 593, 60 | 596, 61 | 619, 62 | 627, 63 | 633, 64 | 642, 65 | 645, 66 | 665, 67 | 669, 68 | 670, 69 | 725, 70 | 728, 71 | 743, 72 | 757, 73 | 760, 74 | 797, 75 | 798, 76 | 807, 77 | 813, 78 | 833, 79 | 838, 80 | 846, 81 | 851, 82 | 852, 83 | 873, 84 | 883, 85 | 913, 86 | 914, 87 | 923, 88 | 930, 89 | 940, 90 | 941, 91 | 954, 92 | 976, 93 | 1017, 94 | 1018, 95 | 1026, 96 | 1044, 97 | 1048, 98 | 1061, 99 | 1065, 100 | 1088, 101 | 1111, 102 | 1128, 103 | 1131, 104 | 1133, 105 | 1145, 106 | 1152, 107 | 1156, 108 | 1165, 109 | 1166, 110 | 1186, 111 | 1189, 112 | 1195, 113 | 1212, 114 | 1252, 115 | 1262, 116 | 1266, 117 | 1288, 118 | 1299, 119 | 1311, 120 | 1320, 121 | 1344, 122 | 1349, 123 | 1351, 124 | 1358, 125 | 1362, 126 | 1366, 127 | 1375, 128 | 1389, 129 | 1405, 130 | 1436, 131 | 1449, 132 | 1455, 133 | 1458, 134 | 1461, 135 | 1464, 136 | 1478, 137 | 1481, 138 | 1482, 139 | 1484, 140 | 1507, 141 | 1517, 142 | 1522, 143 | 1525, 144 | 1527, 145 | 1537, 146 | 1541, 147 | 1566, 148 | 1582, 149 | 1585, 150 | 1611, 151 | 1613, 152 | 1615, 153 | 1621, 154 | 1633, 155 | 1634, 156 | 1636, 157 | 1665, 158 | 1666, 159 | 1671, 160 | 1677, 161 | 1681, 162 | 1683, 163 | 1684, 164 | 1689, 165 | 1703, 166 | 1715, 167 | 1717, 168 | 1722, 169 | 1729, 170 | 1732, 171 | 1733, 172 | 1740, 173 | 1754, 174 | 1759, 175 | 1786, 176 | 1805, 177 | 1809, 178 | 1814, 179 | 1823, 180 | 1857, 181 | 1860, 182 | 1866, 183 | 1886, 184 | 1897, 185 | 1912, 186 | 1922, 187 | 1941, 188 | 1948, 189 | 1967, 190 | 1980, 191 | 2001, 192 | 2008, 193 | 2015, 194 | 2047, 195 | 2057, 196 | 2058, 197 | 2066, 198 | 2112, 199 | 2114, 200 | 2130, 201 | 2149, 202 | 2154, 203 | 2155, 204 | 2161, 205 | 2166, 206 | 2169, 207 | 2188, 208 | 2189, 209 | 2212, 210 | 2213, 211 | 2228, 212 | 2235, 213 | 2251, 214 | 2257, 215 | 2262, 216 | 2265, 217 | 2281, 218 | 2321, 219 | 2326, 220 | 2333, 221 | 2337, 222 | 2343, 223 | 2350, 224 | 2359, 225 | 2360, 226 | 2374, 227 | 2375, 228 | 2399, 229 | 2409, 230 | 2419, 231 | 2424, 232 | 2425, 233 | 2439, 234 | 2450, 235 | 2451, 236 | 2465, 237 | 2466, 238 | 2471, 239 | 2475, 240 | 2488, 241 | 2506, 242 | 2534, 243 | 2535, 244 | 2537, 245 | 2564, 246 | 2572, 247 | 2574, 248 | 2577, 249 | 2581, 250 | 2587, 251 | 2600, 252 | 2606, 253 | 2618, 254 | 2620, 255 | 2641, 256 | 2648, 257 | 2653, 258 | 2669, 259 | 2707, 260 | 2719, 261 | 2723, 262 | 2749, 263 | 2766, 264 | 2774, 265 | 2776, 266 | 2779, 267 | 2785, 268 | 2794, 269 | 2800, 270 | 2804, 271 | 2822, 272 | 2823, 273 | 2832, 274 | 2842, 275 | 2855, 276 | 2856, 277 | 2868, 278 | 2871, 279 | 2874, 280 | 2880, 281 | 2883, 282 | 2884, 283 | 2904, 284 | 2940, 285 | 2949, 286 | 2956, 287 | 2963, 288 | 2970, 289 | 2980, 290 | 2981, 291 | 2999, 292 | 3010, 293 | 3011, 294 | 3015, 295 | 3030, 296 | 3052, 297 | 3058, 298 | 3067, 299 | 3084, 300 | 3098, 301 | 3113, 302 | 3123, 303 | 3137, 304 | 3141, 305 | 3159, 306 | 3165, 307 | 3177, 308 | 3183, 309 | 3205, 310 | 3222, 311 | 3235, 312 | 3243, 313 | 3248, 314 | 3310, 315 | 3312, 316 | 3319, 317 | 3323, 318 | 3347, 319 | 3354, 320 | 3372, 321 | 3381, 322 | 3393, 323 | 3395, 324 | 3400, 325 | 3405, 326 | 3425, 327 | 3442, 328 | 3466, 329 | 3479, 330 | 3485, 331 | 3487, 332 | 3490, 333 | 3495, 334 | 3517, 335 | 3546, 336 | 3550, 337 | 3551, 338 | 3552, 339 | 3556, 340 | 3559, 341 | 3593, 342 | 3596, 343 | 3605, 344 | 3615, 345 | 3626, 346 | 3637, 347 | 3653, 348 | 3654, 349 | 3657, 350 | 3664, 351 | 3673, 352 | 3685, 353 | 3719, 354 | 3721, 355 | 3728, 356 | 3735, 357 | 3739, 358 | 3741, 359 | 3748, 360 | 3758, 361 | 3767, 362 | 3779, 363 | 3797, 364 | 3816, 365 | 3822, 366 | 3845, 367 | 3874, 368 | 3876, 369 | 3877, 370 | 3889, 371 | 3900, 372 | 3903, 373 | 3915, 374 | 3921, 375 | 3924, 376 | 3931, 377 | 3943, 378 | 3956, 379 | 3976, 380 | 3978, 381 | 3987, 382 | 3994, 383 | 4001, 384 | 4004, 385 | 4005, 386 | 4009, 387 | 4015, 388 | 4020, 389 | 4027, 390 | 4029, 391 | 4056, 392 | 4067, 393 | 4075, 394 | 4092, 395 | 4096, 396 | 4097, 397 | 4100, 398 | 4123, 399 | 4148, 400 | 4157, 401 | 4161, 402 | 4172, 403 | 4179, 404 | 4180, 405 | 4186, 406 | 4191, 407 | 4195, 408 | 4198, 409 | 4213, 410 | 4215, 411 | 4234, 412 | 4240, 413 | 4242, 414 | 4268, 415 | 4270, 416 | 4295, 417 | 4298, 418 | 4353, 419 | 4356, 420 | 4360, 421 | 4381, 422 | 4383, 423 | 4385, 424 | 4398, 425 | 4407, 426 | 4410, 427 | 4414, 428 | 4417, 429 | 4420, 430 | 4421, 431 | 4424, 432 | 4429, 433 | 4447, 434 | 4462, 435 | 4463, 436 | 4465, 437 | 4471, 438 | 4476, 439 | 4484, 440 | 4489, 441 | 4504, 442 | 4512, 443 | 4526, 444 | 4528, 445 | 4542, 446 | 4547, 447 | 4558, 448 | 4570, 449 | 4578, 450 | 4582, 451 | 4586, 452 | 4609, 453 | 4630, 454 | 4633, 455 | 4646, 456 | 4663, 457 | 4664, 458 | 4666, 459 | 4670, 460 | 4674, 461 | 4689, 462 | 4700, 463 | 4712, 464 | 4714, 465 | 4722, 466 | 4757, 467 | 4770, 468 | 4772, 469 | 4781, 470 | 4801, 471 | 4805, 472 | 4807, 473 | 4826, 474 | 4828, 475 | 4830, 476 | 4831, 477 | 4835, 478 | 4838, 479 | 4843, 480 | 4854, 481 | 4863, 482 | 4866, 483 | 4874, 484 | 4880, 485 | 4881, 486 | 4882, 487 | 4885, 488 | 4886, 489 | 4888, 490 | 4891, 491 | 4910, 492 | 4914, 493 | 4920, 494 | 4927, 495 | 4938, 496 | 4944, 497 | 4954, 498 | 4956, 499 | 4960, 500 | 4962, 501 | 4972, 502 | 4974, 503 | 4975, 504 | 4998, 505 | 5010, 506 | 5013, 507 | 5015, 508 | 5018, 509 | 5021, 510 | 5026, 511 | 5034, 512 | 5036, 513 | 5040, 514 | 5043, 515 | 5053, 516 | 5060, 517 | 5069, 518 | 5076, 519 | 5080, 520 | 5095, 521 | 5098 522 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 20, 4 | 24, 5 | 40, 6 | 65, 7 | 69, 8 | 75, 9 | 98, 10 | 100, 11 | 107, 12 | 113, 13 | 122, 14 | 123, 15 | 189, 16 | 208, 17 | 220, 18 | 230, 19 | 236, 20 | 245, 21 | 253, 22 | 263, 23 | 266, 24 | 291, 25 | 299, 26 | 302, 27 | 324, 28 | 328, 29 | 336, 30 | 339, 31 | 345, 32 | 356, 33 | 361, 34 | 370, 35 | 374, 36 | 431, 37 | 433, 38 | 436, 39 | 462, 40 | 479, 41 | 486, 42 | 490, 43 | 502, 44 | 505, 45 | 515, 46 | 529, 47 | 537, 48 | 544, 49 | 555, 50 | 577, 51 | 606, 52 | 617, 53 | 622, 54 | 623, 55 | 630, 56 | 632, 57 | 697, 58 | 731, 59 | 737, 60 | 744, 61 | 756, 62 | 778, 63 | 795, 64 | 801, 65 | 835, 66 | 836, 67 | 847, 68 | 868, 69 | 888, 70 | 889, 71 | 903, 72 | 906, 73 | 908, 74 | 918, 75 | 952, 76 | 959, 77 | 965, 78 | 983, 79 | 984, 80 | 986, 81 | 990, 82 | 1008, 83 | 1022, 84 | 1039, 85 | 1040, 86 | 1051, 87 | 1055, 88 | 1059, 89 | 1067, 90 | 1092, 91 | 1104, 92 | 1109, 93 | 1110, 94 | 1112, 95 | 1138, 96 | 1174, 97 | 1181, 98 | 1183, 99 | 1187, 100 | 1200, 101 | 1209, 102 | 1269, 103 | 1278, 104 | 1283, 105 | 1323, 106 | 1326, 107 | 1331, 108 | 1342, 109 | 1354, 110 | 1361, 111 | 1363, 112 | 1385, 113 | 1387, 114 | 1392, 115 | 1404, 116 | 1430, 117 | 1433, 118 | 1438, 119 | 1439, 120 | 1452, 121 | 1456, 122 | 1469, 123 | 1475, 124 | 1489, 125 | 1490, 126 | 1500, 127 | 1502, 128 | 1509, 129 | 1516, 130 | 1520, 131 | 1538, 132 | 1543, 133 | 1546, 134 | 1548, 135 | 1551, 136 | 1561, 137 | 1568, 138 | 1569, 139 | 1572, 140 | 1581, 141 | 1586, 142 | 1592, 143 | 1599, 144 | 1610, 145 | 1612, 146 | 1637, 147 | 1650, 148 | 1651, 149 | 1654, 150 | 1672, 151 | 1694, 152 | 1697, 153 | 1716, 154 | 1723, 155 | 1726, 156 | 1747, 157 | 1752, 158 | 1755, 159 | 1756, 160 | 1770, 161 | 1781, 162 | 1782, 163 | 1784, 164 | 1790, 165 | 1804, 166 | 1818, 167 | 1820, 168 | 1838, 169 | 1851, 170 | 1875, 171 | 1907, 172 | 1918, 173 | 1925, 174 | 1929, 175 | 1964, 176 | 1965, 177 | 1968, 178 | 1970, 179 | 1973, 180 | 1974, 181 | 1979, 182 | 1981, 183 | 1988, 184 | 1993, 185 | 2002, 186 | 2010, 187 | 2024, 188 | 2027, 189 | 2041, 190 | 2046, 191 | 2051, 192 | 2052, 193 | 2073, 194 | 2077, 195 | 2080, 196 | 2094, 197 | 2104, 198 | 2110, 199 | 2128, 200 | 2131, 201 | 2156, 202 | 2176, 203 | 2178, 204 | 2181, 205 | 2215, 206 | 2226, 207 | 2232, 208 | 2238, 209 | 2240, 210 | 2264, 211 | 2292, 212 | 2296, 213 | 2299, 214 | 2300, 215 | 2303, 216 | 2307, 217 | 2309, 218 | 2319, 219 | 2323, 220 | 2334, 221 | 2347, 222 | 2365, 223 | 2370, 224 | 2377, 225 | 2382, 226 | 2400, 227 | 2421, 228 | 2427, 229 | 2430, 230 | 2433, 231 | 2454, 232 | 2455, 233 | 2460, 234 | 2461, 235 | 2477, 236 | 2485, 237 | 2490, 238 | 2493, 239 | 2504, 240 | 2515, 241 | 2516, 242 | 2518, 243 | 2528, 244 | 2530, 245 | 2532, 246 | 2538, 247 | 2540, 248 | 2542, 249 | 2543, 250 | 2547, 251 | 2561, 252 | 2626, 253 | 2630, 254 | 2642, 255 | 2656, 256 | 2664, 257 | 2685, 258 | 2693, 259 | 2697, 260 | 2700, 261 | 2713, 262 | 2726, 263 | 2729, 264 | 2733, 265 | 2754, 266 | 2763, 267 | 2777, 268 | 2809, 269 | 2810, 270 | 2815, 271 | 2846, 272 | 2858, 273 | 2865, 274 | 2878, 275 | 2881, 276 | 2907, 277 | 2915, 278 | 2918, 279 | 2922, 280 | 2931, 281 | 2944, 282 | 2968, 283 | 2973, 284 | 2985, 285 | 2986, 286 | 2990, 287 | 2995, 288 | 3000, 289 | 3018, 290 | 3037, 291 | 3044, 292 | 3045, 293 | 3072, 294 | 3076, 295 | 3097, 296 | 3103, 297 | 3104, 298 | 3120, 299 | 3121, 300 | 3128, 301 | 3129, 302 | 3130, 303 | 3148, 304 | 3188, 305 | 3200, 306 | 3213, 307 | 3214, 308 | 3220, 309 | 3226, 310 | 3237, 311 | 3238, 312 | 3266, 313 | 3270, 314 | 3280, 315 | 3281, 316 | 3287, 317 | 3291, 318 | 3292, 319 | 3301, 320 | 3313, 321 | 3318, 322 | 3326, 323 | 3333, 324 | 3339, 325 | 3350, 326 | 3351, 327 | 3371, 328 | 3373, 329 | 3379, 330 | 3391, 331 | 3412, 332 | 3419, 333 | 3426, 334 | 3429, 335 | 3452, 336 | 3460, 337 | 3462, 338 | 3480, 339 | 3483, 340 | 3489, 341 | 3491, 342 | 3499, 343 | 3506, 344 | 3514, 345 | 3537, 346 | 3558, 347 | 3563, 348 | 3566, 349 | 3567, 350 | 3578, 351 | 3595, 352 | 3606, 353 | 3610, 354 | 3620, 355 | 3629, 356 | 3633, 357 | 3645, 358 | 3679, 359 | 3707, 360 | 3743, 361 | 3757, 362 | 3764, 363 | 3776, 364 | 3800, 365 | 3831, 366 | 3832, 367 | 3834, 368 | 3850, 369 | 3865, 370 | 3882, 371 | 3887, 372 | 3898, 373 | 3902, 374 | 3918, 375 | 3930, 376 | 3939, 377 | 3940, 378 | 3946, 379 | 3953, 380 | 3961, 381 | 3966, 382 | 3973, 383 | 3975, 384 | 3977, 385 | 3984, 386 | 3988, 387 | 3989, 388 | 3999, 389 | 4002, 390 | 4022, 391 | 4031, 392 | 4047, 393 | 4052, 394 | 4066, 395 | 4080, 396 | 4101, 397 | 4115, 398 | 4125, 399 | 4136, 400 | 4167, 401 | 4173, 402 | 4183, 403 | 4205, 404 | 4207, 405 | 4208, 406 | 4211, 407 | 4214, 408 | 4228, 409 | 4246, 410 | 4256, 411 | 4257, 412 | 4261, 413 | 4273, 414 | 4286, 415 | 4299, 416 | 4302, 417 | 4309, 418 | 4313, 419 | 4318, 420 | 4328, 421 | 4332, 422 | 4338, 423 | 4340, 424 | 4344, 425 | 4349, 426 | 4365, 427 | 4374, 428 | 4394, 429 | 4399, 430 | 4408, 431 | 4409, 432 | 4434, 433 | 4441, 434 | 4470, 435 | 4473, 436 | 4490, 437 | 4491, 438 | 4500, 439 | 4516, 440 | 4520, 441 | 4524, 442 | 4534, 443 | 4567, 444 | 4574, 445 | 4577, 446 | 4589, 447 | 4626, 448 | 4632, 449 | 4639, 450 | 4658, 451 | 4662, 452 | 4684, 453 | 4701, 454 | 4718, 455 | 4728, 456 | 4763, 457 | 4780, 458 | 4786, 459 | 4791, 460 | 4802, 461 | 4806, 462 | 4818, 463 | 4833, 464 | 4836, 465 | 4850, 466 | 4852, 467 | 4862, 468 | 4877, 469 | 4892, 470 | 4905, 471 | 4918, 472 | 4951, 473 | 4957, 474 | 4976, 475 | 5012, 476 | 5022, 477 | 5028, 478 | 5068, 479 | 5070, 480 | 5077, 481 | 5093 482 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 2, 4 | 17, 5 | 18, 6 | 28, 7 | 41, 8 | 44, 9 | 45, 10 | 47, 11 | 48, 12 | 73, 13 | 82, 14 | 84, 15 | 105, 16 | 125, 17 | 129, 18 | 134, 19 | 151, 20 | 153, 21 | 155, 22 | 157, 23 | 163, 24 | 178, 25 | 180, 26 | 184, 27 | 187, 28 | 216, 29 | 219, 30 | 222, 31 | 241, 32 | 246, 33 | 278, 34 | 280, 35 | 288, 36 | 289, 37 | 325, 38 | 327, 39 | 331, 40 | 335, 41 | 346, 42 | 366, 43 | 369, 44 | 378, 45 | 379, 46 | 390, 47 | 393, 48 | 400, 49 | 414, 50 | 422, 51 | 423, 52 | 434, 53 | 437, 54 | 444, 55 | 452, 56 | 457, 57 | 471, 58 | 489, 59 | 497, 60 | 508, 61 | 510, 62 | 514, 63 | 521, 64 | 546, 65 | 560, 66 | 569, 67 | 570, 68 | 573, 69 | 600, 70 | 611, 71 | 631, 72 | 636, 73 | 637, 74 | 652, 75 | 659, 76 | 663, 77 | 675, 78 | 692, 79 | 699, 80 | 706, 81 | 708, 82 | 733, 83 | 735, 84 | 738, 85 | 746, 86 | 751, 87 | 761, 88 | 765, 89 | 777, 90 | 779, 91 | 785, 92 | 791, 93 | 802, 94 | 806, 95 | 816, 96 | 826, 97 | 827, 98 | 858, 99 | 860, 100 | 861, 101 | 864, 102 | 894, 103 | 899, 104 | 919, 105 | 960, 106 | 972, 107 | 974, 108 | 982, 109 | 998, 110 | 999, 111 | 1014, 112 | 1032, 113 | 1038, 114 | 1047, 115 | 1058, 116 | 1069, 117 | 1080, 118 | 1087, 119 | 1089, 120 | 1090, 121 | 1096, 122 | 1099, 123 | 1108, 124 | 1135, 125 | 1142, 126 | 1158, 127 | 1161, 128 | 1168, 129 | 1170, 130 | 1180, 131 | 1182, 132 | 1196, 133 | 1208, 134 | 1211, 135 | 1213, 136 | 1222, 137 | 1235, 138 | 1243, 139 | 1248, 140 | 1260, 141 | 1272, 142 | 1276, 143 | 1284, 144 | 1289, 145 | 1295, 146 | 1316, 147 | 1330, 148 | 1334, 149 | 1336, 150 | 1339, 151 | 1365, 152 | 1367, 153 | 1368, 154 | 1373, 155 | 1399, 156 | 1402, 157 | 1414, 158 | 1424, 159 | 1442, 160 | 1457, 161 | 1462, 162 | 1463, 163 | 1468, 164 | 1470, 165 | 1486, 166 | 1493, 167 | 1511, 168 | 1519, 169 | 1533, 170 | 1539, 171 | 1547, 172 | 1555, 173 | 1557, 174 | 1563, 175 | 1564, 176 | 1565, 177 | 1578, 178 | 1588, 179 | 1601, 180 | 1626, 181 | 1657, 182 | 1658, 183 | 1680, 184 | 1685, 185 | 1688, 186 | 1690, 187 | 1695, 188 | 1700, 189 | 1705, 190 | 1718, 191 | 1727, 192 | 1734, 193 | 1738, 194 | 1739, 195 | 1745, 196 | 1764, 197 | 1773, 198 | 1788, 199 | 1806, 200 | 1849, 201 | 1850, 202 | 1856, 203 | 1858, 204 | 1865, 205 | 1867, 206 | 1883, 207 | 1885, 208 | 1909, 209 | 1913, 210 | 1947, 211 | 1958, 212 | 1984, 213 | 1990, 214 | 1998, 215 | 2009, 216 | 2011, 217 | 2012, 218 | 2021, 219 | 2026, 220 | 2037, 221 | 2043, 222 | 2050, 223 | 2054, 224 | 2055, 225 | 2059, 226 | 2061, 227 | 2065, 228 | 2078, 229 | 2081, 230 | 2084, 231 | 2101, 232 | 2102, 233 | 2109, 234 | 2118, 235 | 2134, 236 | 2151, 237 | 2162, 238 | 2185, 239 | 2210, 240 | 2216, 241 | 2233, 242 | 2243, 243 | 2250, 244 | 2259, 245 | 2270, 246 | 2278, 247 | 2286, 248 | 2288, 249 | 2291, 250 | 2305, 251 | 2314, 252 | 2327, 253 | 2339, 254 | 2341, 255 | 2348, 256 | 2355, 257 | 2363, 258 | 2369, 259 | 2380, 260 | 2398, 261 | 2429, 262 | 2431, 263 | 2452, 264 | 2464, 265 | 2474, 266 | 2479, 267 | 2482, 268 | 2489, 269 | 2492, 270 | 2495, 271 | 2497, 272 | 2502, 273 | 2505, 274 | 2524, 275 | 2531, 276 | 2541, 277 | 2544, 278 | 2545, 279 | 2573, 280 | 2583, 281 | 2635, 282 | 2643, 283 | 2660, 284 | 2671, 285 | 2673, 286 | 2677, 287 | 2710, 288 | 2728, 289 | 2731, 290 | 2735, 291 | 2737, 292 | 2741, 293 | 2745, 294 | 2753, 295 | 2761, 296 | 2762, 297 | 2793, 298 | 2796, 299 | 2798, 300 | 2805, 301 | 2835, 302 | 2840, 303 | 2844, 304 | 2851, 305 | 2875, 306 | 2891, 307 | 2898, 308 | 2906, 309 | 2911, 310 | 2921, 311 | 2932, 312 | 2941, 313 | 2947, 314 | 2950, 315 | 2953, 316 | 2972, 317 | 2978, 318 | 2982, 319 | 2984, 320 | 2994, 321 | 3002, 322 | 3003, 323 | 3017, 324 | 3026, 325 | 3039, 326 | 3043, 327 | 3049, 328 | 3094, 329 | 3108, 330 | 3110, 331 | 3127, 332 | 3131, 333 | 3154, 334 | 3180, 335 | 3189, 336 | 3192, 337 | 3216, 338 | 3217, 339 | 3227, 340 | 3233, 341 | 3240, 342 | 3250, 343 | 3258, 344 | 3267, 345 | 3275, 346 | 3276, 347 | 3300, 348 | 3304, 349 | 3328, 350 | 3331, 351 | 3345, 352 | 3355, 353 | 3369, 354 | 3376, 355 | 3386, 356 | 3390, 357 | 3394, 358 | 3399, 359 | 3444, 360 | 3448, 361 | 3473, 362 | 3477, 363 | 3484, 364 | 3494, 365 | 3496, 366 | 3503, 367 | 3507, 368 | 3557, 369 | 3564, 370 | 3590, 371 | 3603, 372 | 3616, 373 | 3623, 374 | 3635, 375 | 3636, 376 | 3638, 377 | 3640, 378 | 3647, 379 | 3649, 380 | 3665, 381 | 3668, 382 | 3680, 383 | 3702, 384 | 3704, 385 | 3705, 386 | 3711, 387 | 3714, 388 | 3749, 389 | 3752, 390 | 3753, 391 | 3754, 392 | 3759, 393 | 3766, 394 | 3775, 395 | 3785, 396 | 3801, 397 | 3820, 398 | 3829, 399 | 3835, 400 | 3840, 401 | 3842, 402 | 3844, 403 | 3849, 404 | 3859, 405 | 3875, 406 | 3905, 407 | 3906, 408 | 3911, 409 | 3929, 410 | 3941, 411 | 3951, 412 | 3959, 413 | 3968, 414 | 3970, 415 | 4003, 416 | 4006, 417 | 4019, 418 | 4028, 419 | 4083, 420 | 4149, 421 | 4153, 422 | 4155, 423 | 4168, 424 | 4187, 425 | 4193, 426 | 4203, 427 | 4209, 428 | 4217, 429 | 4219, 430 | 4222, 431 | 4238, 432 | 4272, 433 | 4277, 434 | 4300, 435 | 4305, 436 | 4308, 437 | 4324, 438 | 4334, 439 | 4341, 440 | 4345, 441 | 4357, 442 | 4358, 443 | 4359, 444 | 4363, 445 | 4373, 446 | 4393, 447 | 4397, 448 | 4403, 449 | 4416, 450 | 4451, 451 | 4452, 452 | 4456, 453 | 4459, 454 | 4478, 455 | 4479, 456 | 4480, 457 | 4486, 458 | 4495, 459 | 4498, 460 | 4511, 461 | 4545, 462 | 4555, 463 | 4565, 464 | 4568, 465 | 4573, 466 | 4584, 467 | 4590, 468 | 4607, 469 | 4610, 470 | 4623, 471 | 4647, 472 | 4656, 473 | 4671, 474 | 4672, 475 | 4682, 476 | 4685, 477 | 4724, 478 | 4727, 479 | 4750, 480 | 4754, 481 | 4764, 482 | 4771, 483 | 4773, 484 | 4787, 485 | 4792, 486 | 4794, 487 | 4825, 488 | 4837, 489 | 4840, 490 | 4845, 491 | 4846, 492 | 4848, 493 | 4857, 494 | 4864, 495 | 4872, 496 | 4887, 497 | 4890, 498 | 4897, 499 | 4898, 500 | 4901, 501 | 4917, 502 | 4929, 503 | 4942, 504 | 4952, 505 | 4965, 506 | 4981, 507 | 4991, 508 | 5001, 509 | 5007, 510 | 5014, 511 | 5025, 512 | 5046, 513 | 5047, 514 | 5052, 515 | 5055, 516 | 5075, 517 | 5081, 518 | 5085, 519 | 5091 520 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 14, 3 | 15, 4 | 19, 5 | 27, 6 | 42, 7 | 52, 8 | 60, 9 | 72, 10 | 78, 11 | 91, 12 | 116, 13 | 121, 14 | 141, 15 | 168, 16 | 182, 17 | 185, 18 | 193, 19 | 204, 20 | 209, 21 | 224, 22 | 229, 23 | 232, 24 | 255, 25 | 272, 26 | 293, 27 | 308, 28 | 311, 29 | 322, 30 | 326, 31 | 342, 32 | 363, 33 | 376, 34 | 389, 35 | 399, 36 | 407, 37 | 419, 38 | 420, 39 | 421, 40 | 426, 41 | 428, 42 | 430, 43 | 439, 44 | 456, 45 | 477, 46 | 518, 47 | 526, 48 | 541, 49 | 550, 50 | 551, 51 | 557, 52 | 578, 53 | 581, 54 | 602, 55 | 607, 56 | 610, 57 | 661, 58 | 673, 59 | 686, 60 | 687, 61 | 696, 62 | 711, 63 | 712, 64 | 713, 65 | 718, 66 | 734, 67 | 739, 68 | 748, 69 | 771, 70 | 773, 71 | 790, 72 | 794, 73 | 810, 74 | 821, 75 | 824, 76 | 825, 77 | 830, 78 | 832, 79 | 837, 80 | 842, 81 | 855, 82 | 865, 83 | 869, 84 | 892, 85 | 895, 86 | 896, 87 | 898, 88 | 909, 89 | 926, 90 | 942, 91 | 945, 92 | 953, 93 | 957, 94 | 958, 95 | 963, 96 | 992, 97 | 997, 98 | 1001, 99 | 1013, 100 | 1033, 101 | 1036, 102 | 1037, 103 | 1062, 104 | 1076, 105 | 1081, 106 | 1097, 107 | 1106, 108 | 1118, 109 | 1121, 110 | 1125, 111 | 1136, 112 | 1153, 113 | 1155, 114 | 1162, 115 | 1179, 116 | 1185, 117 | 1194, 118 | 1198, 119 | 1199, 120 | 1201, 121 | 1204, 122 | 1205, 123 | 1207, 124 | 1218, 125 | 1220, 126 | 1229, 127 | 1247, 128 | 1255, 129 | 1256, 130 | 1264, 131 | 1268, 132 | 1285, 133 | 1291, 134 | 1304, 135 | 1305, 136 | 1333, 137 | 1350, 138 | 1356, 139 | 1372, 140 | 1381, 141 | 1388, 142 | 1391, 143 | 1394, 144 | 1412, 145 | 1416, 146 | 1444, 147 | 1460, 148 | 1472, 149 | 1477, 150 | 1495, 151 | 1497, 152 | 1504, 153 | 1510, 154 | 1513, 155 | 1518, 156 | 1526, 157 | 1530, 158 | 1531, 159 | 1534, 160 | 1544, 161 | 1550, 162 | 1573, 163 | 1574, 164 | 1575, 165 | 1576, 166 | 1579, 167 | 1591, 168 | 1596, 169 | 1605, 170 | 1656, 171 | 1661, 172 | 1664, 173 | 1693, 174 | 1698, 175 | 1708, 176 | 1709, 177 | 1714, 178 | 1720, 179 | 1731, 180 | 1746, 181 | 1751, 182 | 1774, 183 | 1785, 184 | 1821, 185 | 1822, 186 | 1828, 187 | 1836, 188 | 1840, 189 | 1843, 190 | 1848, 191 | 1853, 192 | 1871, 193 | 1880, 194 | 1881, 195 | 1887, 196 | 1894, 197 | 1898, 198 | 1901, 199 | 1904, 200 | 1923, 201 | 1930, 202 | 1931, 203 | 1932, 204 | 1937, 205 | 1960, 206 | 1971, 207 | 1978, 208 | 1985, 209 | 1986, 210 | 1999, 211 | 2000, 212 | 2028, 213 | 2034, 214 | 2048, 215 | 2049, 216 | 2053, 217 | 2072, 218 | 2095, 219 | 2108, 220 | 2117, 221 | 2119, 222 | 2125, 223 | 2139, 224 | 2140, 225 | 2141, 226 | 2160, 227 | 2170, 228 | 2186, 229 | 2196, 230 | 2200, 231 | 2221, 232 | 2224, 233 | 2229, 234 | 2244, 235 | 2256, 236 | 2260, 237 | 2266, 238 | 2267, 239 | 2274, 240 | 2280, 241 | 2285, 242 | 2289, 243 | 2293, 244 | 2315, 245 | 2317, 246 | 2328, 247 | 2331, 248 | 2345, 249 | 2354, 250 | 2366, 251 | 2367, 252 | 2384, 253 | 2389, 254 | 2396, 255 | 2401, 256 | 2412, 257 | 2413, 258 | 2415, 259 | 2441, 260 | 2444, 261 | 2453, 262 | 2457, 263 | 2472, 264 | 2507, 265 | 2520, 266 | 2525, 267 | 2551, 268 | 2565, 269 | 2585, 270 | 2602, 271 | 2615, 272 | 2619, 273 | 2622, 274 | 2646, 275 | 2674, 276 | 2681, 277 | 2687, 278 | 2695, 279 | 2703, 280 | 2734, 281 | 2736, 282 | 2740, 283 | 2752, 284 | 2758, 285 | 2765, 286 | 2768, 287 | 2778, 288 | 2786, 289 | 2788, 290 | 2790, 291 | 2827, 292 | 2839, 293 | 2843, 294 | 2852, 295 | 2869, 296 | 2872, 297 | 2873, 298 | 2879, 299 | 2886, 300 | 2890, 301 | 2892, 302 | 2903, 303 | 2909, 304 | 2914, 305 | 2923, 306 | 2925, 307 | 2928, 308 | 2945, 309 | 2962, 310 | 2966, 311 | 2974, 312 | 2987, 313 | 2988, 314 | 2993, 315 | 3004, 316 | 3009, 317 | 3032, 318 | 3034, 319 | 3069, 320 | 3087, 321 | 3091, 322 | 3122, 323 | 3142, 324 | 3149, 325 | 3150, 326 | 3151, 327 | 3160, 328 | 3175, 329 | 3196, 330 | 3201, 331 | 3212, 332 | 3215, 333 | 3221, 334 | 3223, 335 | 3232, 336 | 3247, 337 | 3272, 338 | 3274, 339 | 3290, 340 | 3293, 341 | 3298, 342 | 3303, 343 | 3316, 344 | 3324, 345 | 3327, 346 | 3335, 347 | 3338, 348 | 3342, 349 | 3344, 350 | 3356, 351 | 3374, 352 | 3387, 353 | 3388, 354 | 3397, 355 | 3403, 356 | 3404, 357 | 3406, 358 | 3422, 359 | 3438, 360 | 3441, 361 | 3443, 362 | 3454, 363 | 3459, 364 | 3469, 365 | 3475, 366 | 3502, 367 | 3510, 368 | 3538, 369 | 3540, 370 | 3541, 371 | 3545, 372 | 3549, 373 | 3576, 374 | 3589, 375 | 3601, 376 | 3608, 377 | 3625, 378 | 3639, 379 | 3641, 380 | 3671, 381 | 3674, 382 | 3675, 383 | 3682, 384 | 3686, 385 | 3706, 386 | 3718, 387 | 3724, 388 | 3725, 389 | 3736, 390 | 3744, 391 | 3755, 392 | 3774, 393 | 3780, 394 | 3791, 395 | 3799, 396 | 3818, 397 | 3826, 398 | 3828, 399 | 3833, 400 | 3838, 401 | 3843, 402 | 3878, 403 | 3880, 404 | 3932, 405 | 3945, 406 | 4000, 407 | 4017, 408 | 4046, 409 | 4049, 410 | 4059, 411 | 4061, 412 | 4070, 413 | 4077, 414 | 4079, 415 | 4084, 416 | 4086, 417 | 4094, 418 | 4110, 419 | 4118, 420 | 4156, 421 | 4163, 422 | 4166, 423 | 4189, 424 | 4192, 425 | 4196, 426 | 4218, 427 | 4239, 428 | 4283, 429 | 4291, 430 | 4304, 431 | 4317, 432 | 4326, 433 | 4333, 434 | 4337, 435 | 4355, 436 | 4362, 437 | 4375, 438 | 4382, 439 | 4389, 440 | 4391, 441 | 4395, 442 | 4396, 443 | 4402, 444 | 4404, 445 | 4444, 446 | 4483, 447 | 4506, 448 | 4508, 449 | 4514, 450 | 4550, 451 | 4553, 452 | 4557, 453 | 4561, 454 | 4566, 455 | 4572, 456 | 4599, 457 | 4602, 458 | 4608, 459 | 4616, 460 | 4619, 461 | 4622, 462 | 4625, 463 | 4631, 464 | 4635, 465 | 4636, 466 | 4638, 467 | 4640, 468 | 4642, 469 | 4645, 470 | 4657, 471 | 4698, 472 | 4707, 473 | 4710, 474 | 4736, 475 | 4738, 476 | 4741, 477 | 4742, 478 | 4747, 479 | 4762, 480 | 4776, 481 | 4784, 482 | 4789, 483 | 4803, 484 | 4811, 485 | 4814, 486 | 4821, 487 | 4847, 488 | 4853, 489 | 4860, 490 | 4870, 491 | 4902, 492 | 4903, 493 | 4912, 494 | 4924, 495 | 4930, 496 | 4934, 497 | 4943, 498 | 4946, 499 | 4961, 500 | 4983, 501 | 4984, 502 | 4987, 503 | 5032, 504 | 5041, 505 | 5044, 506 | 5045, 507 | 5050, 508 | 5054, 509 | 5057, 510 | 5066, 511 | 5092, 512 | 5097, 513 | 5099 514 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/freelaw/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 31, 4 | 49, 5 | 50, 6 | 53, 7 | 56, 8 | 64, 9 | 67, 10 | 74, 11 | 79, 12 | 89, 13 | 112, 14 | 120, 15 | 130, 16 | 133, 17 | 152, 18 | 160, 19 | 169, 20 | 174, 21 | 215, 22 | 244, 23 | 248, 24 | 252, 25 | 256, 26 | 259, 27 | 264, 28 | 265, 29 | 267, 30 | 268, 31 | 270, 32 | 298, 33 | 304, 34 | 306, 35 | 312, 36 | 347, 37 | 362, 38 | 377, 39 | 382, 40 | 386, 41 | 394, 42 | 403, 43 | 416, 44 | 447, 45 | 459, 46 | 461, 47 | 470, 48 | 475, 49 | 484, 50 | 491, 51 | 494, 52 | 495, 53 | 498, 54 | 499, 55 | 500, 56 | 507, 57 | 513, 58 | 525, 59 | 527, 60 | 543, 61 | 545, 62 | 559, 63 | 565, 64 | 571, 65 | 579, 66 | 583, 67 | 585, 68 | 604, 69 | 615, 70 | 616, 71 | 621, 72 | 624, 73 | 625, 74 | 628, 75 | 638, 76 | 639, 77 | 646, 78 | 649, 79 | 654, 80 | 658, 81 | 667, 82 | 677, 83 | 678, 84 | 694, 85 | 710, 86 | 727, 87 | 747, 88 | 753, 89 | 758, 90 | 767, 91 | 768, 92 | 776, 93 | 780, 94 | 805, 95 | 819, 96 | 820, 97 | 845, 98 | 849, 99 | 857, 100 | 902, 101 | 912, 102 | 921, 103 | 933, 104 | 934, 105 | 935, 106 | 937, 107 | 951, 108 | 962, 109 | 979, 110 | 991, 111 | 994, 112 | 1005, 113 | 1016, 114 | 1025, 115 | 1029, 116 | 1049, 117 | 1052, 118 | 1063, 119 | 1064, 120 | 1072, 121 | 1073, 122 | 1074, 123 | 1113, 124 | 1119, 125 | 1137, 126 | 1147, 127 | 1157, 128 | 1164, 129 | 1216, 130 | 1217, 131 | 1223, 132 | 1226, 133 | 1227, 134 | 1232, 135 | 1298, 136 | 1312, 137 | 1317, 138 | 1321, 139 | 1324, 140 | 1325, 141 | 1335, 142 | 1338, 143 | 1353, 144 | 1371, 145 | 1377, 146 | 1378, 147 | 1386, 148 | 1395, 149 | 1409, 150 | 1413, 151 | 1419, 152 | 1421, 153 | 1435, 154 | 1450, 155 | 1451, 156 | 1488, 157 | 1503, 158 | 1545, 159 | 1559, 160 | 1560, 161 | 1593, 162 | 1597, 163 | 1625, 164 | 1635, 165 | 1640, 166 | 1648, 167 | 1649, 168 | 1659, 169 | 1692, 170 | 1713, 171 | 1725, 172 | 1742, 173 | 1758, 174 | 1761, 175 | 1769, 176 | 1777, 177 | 1787, 178 | 1791, 179 | 1794, 180 | 1807, 181 | 1815, 182 | 1817, 183 | 1826, 184 | 1829, 185 | 1832, 186 | 1847, 187 | 1854, 188 | 1863, 189 | 1869, 190 | 1882, 191 | 1893, 192 | 1900, 193 | 1911, 194 | 1916, 195 | 1921, 196 | 1926, 197 | 1928, 198 | 1933, 199 | 1940, 200 | 1949, 201 | 1952, 202 | 1956, 203 | 1995, 204 | 2019, 205 | 2022, 206 | 2036, 207 | 2062, 208 | 2064, 209 | 2090, 210 | 2111, 211 | 2115, 212 | 2122, 213 | 2127, 214 | 2137, 215 | 2148, 216 | 2152, 217 | 2158, 218 | 2177, 219 | 2191, 220 | 2192, 221 | 2193, 222 | 2207, 223 | 2231, 224 | 2234, 225 | 2239, 226 | 2242, 227 | 2245, 228 | 2254, 229 | 2282, 230 | 2283, 231 | 2284, 232 | 2311, 233 | 2340, 234 | 2356, 235 | 2362, 236 | 2368, 237 | 2373, 238 | 2386, 239 | 2388, 240 | 2417, 241 | 2420, 242 | 2432, 243 | 2437, 244 | 2438, 245 | 2440, 246 | 2478, 247 | 2494, 248 | 2514, 249 | 2523, 250 | 2526, 251 | 2533, 252 | 2553, 253 | 2554, 254 | 2555, 255 | 2566, 256 | 2570, 257 | 2578, 258 | 2590, 259 | 2594, 260 | 2595, 261 | 2599, 262 | 2609, 263 | 2610, 264 | 2614, 265 | 2623, 266 | 2627, 267 | 2633, 268 | 2654, 269 | 2665, 270 | 2666, 271 | 2686, 272 | 2689, 273 | 2690, 274 | 2708, 275 | 2714, 276 | 2718, 277 | 2738, 278 | 2742, 279 | 2747, 280 | 2750, 281 | 2751, 282 | 2773, 283 | 2781, 284 | 2783, 285 | 2784, 286 | 2797, 287 | 2806, 288 | 2811, 289 | 2818, 290 | 2830, 291 | 2850, 292 | 2857, 293 | 2860, 294 | 2896, 295 | 2899, 296 | 2902, 297 | 2926, 298 | 2934, 299 | 2936, 300 | 2937, 301 | 2952, 302 | 2954, 303 | 2955, 304 | 2957, 305 | 2960, 306 | 2979, 307 | 2998, 308 | 3019, 309 | 3021, 310 | 3031, 311 | 3036, 312 | 3040, 313 | 3048, 314 | 3062, 315 | 3083, 316 | 3086, 317 | 3109, 318 | 3126, 319 | 3134, 320 | 3139, 321 | 3146, 322 | 3171, 323 | 3174, 324 | 3185, 325 | 3191, 326 | 3198, 327 | 3206, 328 | 3244, 329 | 3262, 330 | 3279, 331 | 3320, 332 | 3330, 333 | 3334, 334 | 3341, 335 | 3346, 336 | 3348, 337 | 3360, 338 | 3362, 339 | 3365, 340 | 3366, 341 | 3370, 342 | 3383, 343 | 3413, 344 | 3415, 345 | 3416, 346 | 3433, 347 | 3439, 348 | 3447, 349 | 3464, 350 | 3468, 351 | 3492, 352 | 3501, 353 | 3505, 354 | 3520, 355 | 3526, 356 | 3533, 357 | 3535, 358 | 3536, 359 | 3542, 360 | 3569, 361 | 3573, 362 | 3580, 363 | 3602, 364 | 3624, 365 | 3628, 366 | 3646, 367 | 3655, 368 | 3660, 369 | 3661, 370 | 3678, 371 | 3684, 372 | 3693, 373 | 3697, 374 | 3708, 375 | 3709, 376 | 3715, 377 | 3722, 378 | 3723, 379 | 3788, 380 | 3795, 381 | 3804, 382 | 3811, 383 | 3814, 384 | 3819, 385 | 3836, 386 | 3857, 387 | 3858, 388 | 3860, 389 | 3868, 390 | 3869, 391 | 3872, 392 | 3891, 393 | 3913, 394 | 3948, 395 | 3949, 396 | 3960, 397 | 3967, 398 | 3971, 399 | 3972, 400 | 3980, 401 | 3992, 402 | 4007, 403 | 4037, 404 | 4051, 405 | 4062, 406 | 4076, 407 | 4082, 408 | 4085, 409 | 4087, 410 | 4089, 411 | 4090, 412 | 4098, 413 | 4105, 414 | 4144, 415 | 4158, 416 | 4159, 417 | 4164, 418 | 4169, 419 | 4178, 420 | 4184, 421 | 4190, 422 | 4201, 423 | 4221, 424 | 4226, 425 | 4235, 426 | 4236, 427 | 4243, 428 | 4247, 429 | 4254, 430 | 4258, 431 | 4275, 432 | 4292, 433 | 4307, 434 | 4319, 435 | 4346, 436 | 4351, 437 | 4352, 438 | 4368, 439 | 4370, 440 | 4379, 441 | 4405, 442 | 4415, 443 | 4423, 444 | 4430, 445 | 4445, 446 | 4469, 447 | 4485, 448 | 4492, 449 | 4503, 450 | 4525, 451 | 4537, 452 | 4541, 453 | 4549, 454 | 4554, 455 | 4576, 456 | 4591, 457 | 4592, 458 | 4596, 459 | 4597, 460 | 4603, 461 | 4615, 462 | 4621, 463 | 4643, 464 | 4677, 465 | 4678, 466 | 4699, 467 | 4708, 468 | 4709, 469 | 4717, 470 | 4720, 471 | 4740, 472 | 4743, 473 | 4749, 474 | 4755, 475 | 4756, 476 | 4759, 477 | 4760, 478 | 4765, 479 | 4793, 480 | 4795, 481 | 4796, 482 | 4797, 483 | 4804, 484 | 4816, 485 | 4827, 486 | 4855, 487 | 4876, 488 | 4893, 489 | 4904, 490 | 4908, 491 | 4921, 492 | 4937, 493 | 4953, 494 | 4959, 495 | 4979, 496 | 4982, 497 | 5003, 498 | 5048, 499 | 5059, 500 | 5067, 501 | 5071, 502 | 5078, 503 | 5088, 504 | 5090 505 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 13, 3 | 20, 4 | 29, 5 | 34, 6 | 44, 7 | 45, 8 | 51, 9 | 52, 10 | 66, 11 | 67, 12 | 70 13 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 16, 4 | 19, 5 | 28, 6 | 33, 7 | 36, 8 | 63, 9 | 64 10 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 10, 4 | 42, 5 | 74 6 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 12, 4 | 24, 5 | 35, 6 | 49, 7 | 69, 8 | 71 9 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 4, 3 | 7, 4 | 8, 5 | 26, 6 | 31, 7 | 38, 8 | 39, 9 | 40, 10 | 56, 11 | 59, 12 | 60, 13 | 73, 14 | 78, 15 | 79 16 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 25, 4 | 30, 5 | 32, 6 | 48, 7 | 58, 8 | 61, 9 | 72, 10 | 75 11 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 14, 3 | 18, 4 | 22, 5 | 46, 6 | 68, 7 | 76 8 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 17, 4 | 50, 5 | 54, 6 | 55 7 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 9, 4 | 11, 5 | 21, 6 | 37, 7 | 41, 8 | 43, 9 | 47, 10 | 77 11 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/gutenberg/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 15, 3 | 23, 4 | 27, 5 | 53, 6 | 57, 7 | 62, 8 | 65 9 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 14, 4 | 22, 5 | 23, 6 | 25, 7 | 36, 8 | 37, 9 | 38, 10 | 43, 11 | 50, 12 | 54, 13 | 79, 14 | 91, 15 | 102, 16 | 116, 17 | 121, 18 | 126, 19 | 133, 20 | 149, 21 | 172, 22 | 173, 23 | 181, 24 | 200, 25 | 216, 26 | 242, 27 | 247, 28 | 271, 29 | 287, 30 | 306, 31 | 311, 32 | 318, 33 | 328, 34 | 351, 35 | 355, 36 | 378, 37 | 381, 38 | 385, 39 | 396, 40 | 401, 41 | 402, 42 | 408, 43 | 422, 44 | 445, 45 | 455, 46 | 475, 47 | 489, 48 | 503, 49 | 504, 50 | 507, 51 | 520, 52 | 525, 53 | 535, 54 | 538, 55 | 539, 56 | 540, 57 | 549, 58 | 582, 59 | 592, 60 | 596, 61 | 602, 62 | 625, 63 | 637, 64 | 639, 65 | 645, 66 | 672, 67 | 680, 68 | 693, 69 | 700, 70 | 709, 71 | 734, 72 | 744, 73 | 756, 74 | 762, 75 | 769, 76 | 780, 77 | 791, 78 | 794, 79 | 813, 80 | 817, 81 | 818, 82 | 838, 83 | 849, 84 | 868, 85 | 885, 86 | 893, 87 | 895, 88 | 902, 89 | 906, 90 | 918, 91 | 924, 92 | 950, 93 | 971, 94 | 987, 95 | 994, 96 | 995, 97 | 996, 98 | 998, 99 | 999, 100 | 1014, 101 | 1015, 102 | 1016, 103 | 1035, 104 | 1039, 105 | 1044, 106 | 1052, 107 | 1053, 108 | 1054, 109 | 1061, 110 | 1067, 111 | 1083, 112 | 1091, 113 | 1107, 114 | 1114, 115 | 1127, 116 | 1128, 117 | 1145, 118 | 1158, 119 | 1167, 120 | 1175, 121 | 1186, 122 | 1211, 123 | 1227, 124 | 1228, 125 | 1238, 126 | 1254, 127 | 1259, 128 | 1263, 129 | 1269, 130 | 1282, 131 | 1298, 132 | 1303, 133 | 1306, 134 | 1338, 135 | 1345, 136 | 1357, 137 | 1378, 138 | 1388, 139 | 1392, 140 | 1395, 141 | 1396, 142 | 1412, 143 | 1424, 144 | 1427, 145 | 1429, 146 | 1460, 147 | 1469, 148 | 1470, 149 | 1471, 150 | 1476, 151 | 1486, 152 | 1489, 153 | 1497, 154 | 1499, 155 | 1517, 156 | 1546, 157 | 1553, 158 | 1557, 159 | 1572, 160 | 1589, 161 | 1596, 162 | 1602, 163 | 1608, 164 | 1612, 165 | 1616, 166 | 1618 167 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 15, 3 | 18, 4 | 24, 5 | 33, 6 | 73, 7 | 74, 8 | 76, 9 | 77, 10 | 83, 11 | 90, 12 | 96, 13 | 99, 14 | 106, 15 | 109, 16 | 150, 17 | 174, 18 | 184, 19 | 188, 20 | 196, 21 | 204, 22 | 206, 23 | 214, 24 | 232, 25 | 245, 26 | 251, 27 | 263, 28 | 267, 29 | 272, 30 | 290, 31 | 294, 32 | 303, 33 | 314, 34 | 323, 35 | 340, 36 | 358, 37 | 410, 38 | 417, 39 | 421, 40 | 438, 41 | 449, 42 | 454, 43 | 464, 44 | 478, 45 | 484, 46 | 492, 47 | 493, 48 | 496, 49 | 502, 50 | 506, 51 | 509, 52 | 510, 53 | 516, 54 | 527, 55 | 529, 56 | 547, 57 | 548, 58 | 550, 59 | 552, 60 | 560, 61 | 565, 62 | 570, 63 | 576, 64 | 597, 65 | 599, 66 | 605, 67 | 616, 68 | 624, 69 | 630, 70 | 631, 71 | 634, 72 | 655, 73 | 704, 74 | 719, 75 | 726, 76 | 735, 77 | 747, 78 | 760, 79 | 766, 80 | 767, 81 | 768, 82 | 788, 83 | 805, 84 | 806, 85 | 808, 86 | 810, 87 | 814, 88 | 819, 89 | 829, 90 | 837, 91 | 842, 92 | 846, 93 | 850, 94 | 851, 95 | 890, 96 | 908, 97 | 921, 98 | 926, 99 | 927, 100 | 941, 101 | 945, 102 | 949, 103 | 966, 104 | 975, 105 | 976, 106 | 986, 107 | 1002, 108 | 1003, 109 | 1009, 110 | 1010, 111 | 1033, 112 | 1049, 113 | 1074, 114 | 1082, 115 | 1086, 116 | 1105, 117 | 1119, 118 | 1138, 119 | 1141, 120 | 1144, 121 | 1165, 122 | 1169, 123 | 1171, 124 | 1182, 125 | 1196, 126 | 1198, 127 | 1200, 128 | 1212, 129 | 1231, 130 | 1237, 131 | 1252, 132 | 1262, 133 | 1270, 134 | 1300, 135 | 1305, 136 | 1314, 137 | 1318, 138 | 1323, 139 | 1328, 140 | 1350, 141 | 1368, 142 | 1377, 143 | 1390, 144 | 1394, 145 | 1397, 146 | 1440, 147 | 1450, 148 | 1491, 149 | 1492, 150 | 1501, 151 | 1521, 152 | 1526, 153 | 1539, 154 | 1540, 155 | 1545, 156 | 1561, 157 | 1563, 158 | 1578, 159 | 1580, 160 | 1587, 161 | 1595, 162 | 1600, 163 | 1609, 164 | 1613, 165 | 1620, 166 | 1623 167 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 29, 4 | 32, 5 | 44, 6 | 100, 7 | 114, 8 | 124, 9 | 130, 10 | 134, 11 | 146, 12 | 152, 13 | 161, 14 | 179, 15 | 180, 16 | 187, 17 | 211, 18 | 228, 19 | 240, 20 | 246, 21 | 249, 22 | 256, 23 | 260, 24 | 283, 25 | 315, 26 | 319, 27 | 334, 28 | 339, 29 | 346, 30 | 356, 31 | 365, 32 | 366, 33 | 389, 34 | 393, 35 | 395, 36 | 398, 37 | 416, 38 | 419, 39 | 435, 40 | 439, 41 | 463, 42 | 469, 43 | 480, 44 | 499, 45 | 500, 46 | 511, 47 | 513, 48 | 514, 49 | 521, 50 | 534, 51 | 543, 52 | 555, 53 | 556, 54 | 558, 55 | 572, 56 | 581, 57 | 583, 58 | 586, 59 | 591, 60 | 604, 61 | 613, 62 | 626, 63 | 628, 64 | 632, 65 | 640, 66 | 644, 67 | 648, 68 | 649, 69 | 658, 70 | 663, 71 | 679, 72 | 688, 73 | 699, 74 | 711, 75 | 716, 76 | 721, 77 | 724, 78 | 738, 79 | 752, 80 | 781, 81 | 801, 82 | 811, 83 | 816, 84 | 832, 85 | 855, 86 | 859, 87 | 865, 88 | 870, 89 | 891, 90 | 899, 91 | 919, 92 | 933, 93 | 951, 94 | 956, 95 | 958, 96 | 965, 97 | 980, 98 | 989, 99 | 993, 100 | 997, 101 | 1000, 102 | 1004, 103 | 1011, 104 | 1096, 105 | 1097, 106 | 1100, 107 | 1104, 108 | 1108, 109 | 1118, 110 | 1134, 111 | 1150, 112 | 1166, 113 | 1201, 114 | 1210, 115 | 1230, 116 | 1235, 117 | 1246, 118 | 1253, 119 | 1260, 120 | 1264, 121 | 1268, 122 | 1295, 123 | 1311, 124 | 1334, 125 | 1340, 126 | 1343, 127 | 1347, 128 | 1348, 129 | 1354, 130 | 1393, 131 | 1402, 132 | 1406, 133 | 1410, 134 | 1411, 135 | 1413, 136 | 1414, 137 | 1415, 138 | 1433, 139 | 1453, 140 | 1472, 141 | 1478, 142 | 1485, 143 | 1493, 144 | 1502, 145 | 1511, 146 | 1527, 147 | 1538, 148 | 1543, 149 | 1544, 150 | 1562, 151 | 1567, 152 | 1575, 153 | 1588, 154 | 1592, 155 | 1601, 156 | 1603 157 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 8, 3 | 10, 4 | 11, 5 | 21, 6 | 31, 7 | 45, 8 | 47, 9 | 58, 10 | 80, 11 | 97, 12 | 127, 13 | 128, 14 | 132, 15 | 136, 16 | 142, 17 | 154, 18 | 156, 19 | 159, 20 | 163, 21 | 170, 22 | 183, 23 | 186, 24 | 193, 25 | 205, 26 | 212, 27 | 239, 28 | 252, 29 | 273, 30 | 284, 31 | 302, 32 | 307, 33 | 312, 34 | 324, 35 | 325, 36 | 335, 37 | 338, 38 | 360, 39 | 380, 40 | 382, 41 | 390, 42 | 441, 43 | 446, 44 | 451, 45 | 457, 46 | 460, 47 | 468, 48 | 472, 49 | 476, 50 | 481, 51 | 486, 52 | 490, 53 | 498, 54 | 501, 55 | 505, 56 | 536, 57 | 537, 58 | 579, 59 | 601, 60 | 609, 61 | 623, 62 | 643, 63 | 650, 64 | 653, 65 | 657, 66 | 660, 67 | 665, 68 | 673, 69 | 674, 70 | 685, 71 | 691, 72 | 702, 73 | 708, 74 | 714, 75 | 722, 76 | 723, 77 | 731, 78 | 736, 79 | 746, 80 | 751, 81 | 758, 82 | 764, 83 | 789, 84 | 827, 85 | 854, 86 | 858, 87 | 862, 88 | 864, 89 | 879, 90 | 911, 91 | 912, 92 | 914, 93 | 932, 94 | 935, 95 | 946, 96 | 947, 97 | 953, 98 | 954, 99 | 955, 100 | 957, 101 | 974, 102 | 1007, 103 | 1026, 104 | 1043, 105 | 1046, 106 | 1051, 107 | 1065, 108 | 1089, 109 | 1090, 110 | 1112, 111 | 1113, 112 | 1137, 113 | 1140, 114 | 1147, 115 | 1148, 116 | 1159, 117 | 1164, 118 | 1179, 119 | 1188, 120 | 1189, 121 | 1191, 122 | 1207, 123 | 1215, 124 | 1226, 125 | 1232, 126 | 1242, 127 | 1244, 128 | 1258, 129 | 1271, 130 | 1276, 131 | 1285, 132 | 1288, 133 | 1294, 134 | 1304, 135 | 1321, 136 | 1327, 137 | 1332, 138 | 1339, 139 | 1341, 140 | 1361, 141 | 1362, 142 | 1364, 143 | 1369, 144 | 1374, 145 | 1381, 146 | 1384, 147 | 1386, 148 | 1389, 149 | 1400, 150 | 1401, 151 | 1420, 152 | 1434, 153 | 1487, 154 | 1509, 155 | 1516, 156 | 1547, 157 | 1548, 158 | 1568, 159 | 1569, 160 | 1570, 161 | 1571, 162 | 1583, 163 | 1599, 164 | 1622, 165 | 1630 166 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 7, 4 | 48, 5 | 61, 6 | 68, 7 | 72, 8 | 75, 9 | 105, 10 | 107, 11 | 108, 12 | 129, 13 | 131, 14 | 140, 15 | 160, 16 | 190, 17 | 191, 18 | 192, 19 | 199, 20 | 208, 21 | 209, 22 | 213, 23 | 227, 24 | 254, 25 | 259, 26 | 261, 27 | 262, 28 | 268, 29 | 270, 30 | 276, 31 | 291, 32 | 292, 33 | 295, 34 | 299, 35 | 329, 36 | 344, 37 | 345, 38 | 348, 39 | 350, 40 | 353, 41 | 362, 42 | 367, 43 | 370, 44 | 375, 45 | 383, 46 | 397, 47 | 400, 48 | 407, 49 | 413, 50 | 425, 51 | 427, 52 | 434, 53 | 442, 54 | 453, 55 | 479, 56 | 482, 57 | 483, 58 | 512, 59 | 523, 60 | 533, 61 | 563, 62 | 573, 63 | 575, 64 | 578, 65 | 585, 66 | 600, 67 | 608, 68 | 621, 69 | 646, 70 | 656, 71 | 669, 72 | 670, 73 | 671, 74 | 681, 75 | 684, 76 | 697, 77 | 718, 78 | 728, 79 | 741, 80 | 771, 81 | 775, 82 | 777, 83 | 782, 84 | 784, 85 | 785, 86 | 786, 87 | 790, 88 | 795, 89 | 797, 90 | 807, 91 | 815, 92 | 820, 93 | 822, 94 | 831, 95 | 835, 96 | 839, 97 | 841, 98 | 844, 99 | 853, 100 | 856, 101 | 903, 102 | 904, 103 | 910, 104 | 917, 105 | 920, 106 | 939, 107 | 944, 108 | 948, 109 | 969, 110 | 981, 111 | 982, 112 | 988, 113 | 1005, 114 | 1006, 115 | 1008, 116 | 1021, 117 | 1028, 118 | 1031, 119 | 1040, 120 | 1055, 121 | 1062, 122 | 1068, 123 | 1069, 124 | 1081, 125 | 1093, 126 | 1099, 127 | 1110, 128 | 1111, 129 | 1120, 130 | 1121, 131 | 1124, 132 | 1149, 133 | 1163, 134 | 1170, 135 | 1187, 136 | 1194, 137 | 1219, 138 | 1222, 139 | 1233, 140 | 1239, 141 | 1241, 142 | 1261, 143 | 1273, 144 | 1291, 145 | 1292, 146 | 1293, 147 | 1296, 148 | 1326, 149 | 1336, 150 | 1337, 151 | 1363, 152 | 1408, 153 | 1409, 154 | 1418, 155 | 1432, 156 | 1438, 157 | 1442, 158 | 1446, 159 | 1449, 160 | 1454, 161 | 1458, 162 | 1465, 163 | 1475, 164 | 1479, 165 | 1505, 166 | 1519, 167 | 1550, 168 | 1551, 169 | 1581, 170 | 1582, 171 | 1584, 172 | 1606, 173 | 1614 174 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 12, 3 | 17, 4 | 30, 5 | 34, 6 | 39, 7 | 40, 8 | 41, 9 | 46, 10 | 49, 11 | 55, 12 | 56, 13 | 63, 14 | 67, 15 | 89, 16 | 103, 17 | 110, 18 | 119, 19 | 145, 20 | 153, 21 | 155, 22 | 162, 23 | 165, 24 | 167, 25 | 168, 26 | 178, 27 | 194, 28 | 197, 29 | 201, 30 | 203, 31 | 217, 32 | 219, 33 | 235, 34 | 248, 35 | 255, 36 | 279, 37 | 300, 38 | 301, 39 | 308, 40 | 317, 41 | 321, 42 | 331, 43 | 332, 44 | 342, 45 | 364, 46 | 369, 47 | 386, 48 | 391, 49 | 392, 50 | 394, 51 | 399, 52 | 406, 53 | 420, 54 | 428, 55 | 440, 56 | 444, 57 | 459, 58 | 473, 59 | 477, 60 | 485, 61 | 487, 62 | 494, 63 | 495, 64 | 546, 65 | 554, 66 | 561, 67 | 562, 68 | 574, 69 | 584, 70 | 611, 71 | 619, 72 | 638, 73 | 652, 74 | 654, 75 | 667, 76 | 675, 77 | 676, 78 | 678, 79 | 683, 80 | 696, 81 | 698, 82 | 730, 83 | 732, 84 | 737, 85 | 739, 86 | 749, 87 | 759, 88 | 761, 89 | 763, 90 | 792, 91 | 802, 92 | 809, 93 | 826, 94 | 847, 95 | 848, 96 | 857, 97 | 860, 98 | 861, 99 | 873, 100 | 878, 101 | 894, 102 | 896, 103 | 901, 104 | 909, 105 | 923, 106 | 934, 107 | 952, 108 | 967, 109 | 992, 110 | 1012, 111 | 1013, 112 | 1023, 113 | 1030, 114 | 1034, 115 | 1036, 116 | 1041, 117 | 1045, 118 | 1056, 119 | 1057, 120 | 1080, 121 | 1088, 122 | 1126, 123 | 1133, 124 | 1161, 125 | 1172, 126 | 1178, 127 | 1184, 128 | 1190, 129 | 1199, 130 | 1202, 131 | 1203, 132 | 1208, 133 | 1224, 134 | 1229, 135 | 1247, 136 | 1274, 137 | 1275, 138 | 1278, 139 | 1287, 140 | 1289, 141 | 1290, 142 | 1313, 143 | 1322, 144 | 1329, 145 | 1330, 146 | 1353, 147 | 1356, 148 | 1358, 149 | 1359, 150 | 1372, 151 | 1380, 152 | 1391, 153 | 1403, 154 | 1419, 155 | 1444, 156 | 1451, 157 | 1467, 158 | 1468, 159 | 1481, 160 | 1482, 161 | 1484, 162 | 1508, 163 | 1512, 164 | 1513, 165 | 1514, 166 | 1515, 167 | 1530, 168 | 1532, 169 | 1536, 170 | 1555, 171 | 1574, 172 | 1591, 173 | 1610, 174 | 1624, 175 | 1629 176 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 4, 3 | 6, 4 | 20, 5 | 26, 6 | 52, 7 | 59, 8 | 60, 9 | 65, 10 | 66, 11 | 69, 12 | 70, 13 | 84, 14 | 86, 15 | 87, 16 | 92, 17 | 93, 18 | 94, 19 | 111, 20 | 112, 21 | 123, 22 | 135, 23 | 138, 24 | 139, 25 | 158, 26 | 169, 27 | 175, 28 | 189, 29 | 207, 30 | 220, 31 | 223, 32 | 238, 33 | 243, 34 | 253, 35 | 269, 36 | 277, 37 | 281, 38 | 293, 39 | 310, 40 | 320, 41 | 330, 42 | 349, 43 | 359, 44 | 372, 45 | 379, 46 | 388, 47 | 403, 48 | 405, 49 | 418, 50 | 423, 51 | 429, 52 | 432, 53 | 437, 54 | 450, 55 | 458, 56 | 461, 57 | 467, 58 | 497, 59 | 553, 60 | 564, 61 | 571, 62 | 593, 63 | 594, 64 | 606, 65 | 610, 66 | 614, 67 | 615, 68 | 617, 69 | 627, 70 | 636, 71 | 677, 72 | 689, 73 | 692, 74 | 701, 75 | 729, 76 | 770, 77 | 776, 78 | 796, 79 | 821, 80 | 863, 81 | 869, 82 | 876, 83 | 882, 84 | 898, 85 | 922, 86 | 928, 87 | 930, 88 | 936, 89 | 940, 90 | 943, 91 | 959, 92 | 960, 93 | 964, 94 | 985, 95 | 1018, 96 | 1024, 97 | 1058, 98 | 1066, 99 | 1073, 100 | 1076, 101 | 1092, 102 | 1094, 103 | 1095, 104 | 1103, 105 | 1125, 106 | 1130, 107 | 1131, 108 | 1152, 109 | 1157, 110 | 1160, 111 | 1173, 112 | 1192, 113 | 1204, 114 | 1213, 115 | 1220, 116 | 1221, 117 | 1225, 118 | 1256, 119 | 1266, 120 | 1267, 121 | 1277, 122 | 1280, 123 | 1283, 124 | 1297, 125 | 1307, 126 | 1316, 127 | 1319, 128 | 1324, 129 | 1333, 130 | 1352, 131 | 1360, 132 | 1382, 133 | 1428, 134 | 1447, 135 | 1452, 136 | 1462, 137 | 1483, 138 | 1490, 139 | 1496, 140 | 1522, 141 | 1525, 142 | 1528, 143 | 1537, 144 | 1541, 145 | 1556, 146 | 1558, 147 | 1560, 148 | 1565, 149 | 1590, 150 | 1594, 151 | 1605, 152 | 1615, 153 | 1628, 154 | 1631 155 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 16, 4 | 62, 5 | 64, 6 | 85, 7 | 104, 8 | 120, 9 | 137, 10 | 176, 11 | 177, 12 | 182, 13 | 210, 14 | 218, 15 | 225, 16 | 226, 17 | 237, 18 | 241, 19 | 244, 20 | 264, 21 | 265, 22 | 274, 23 | 275, 24 | 278, 25 | 282, 26 | 285, 27 | 288, 28 | 289, 29 | 297, 30 | 304, 31 | 309, 32 | 313, 33 | 322, 34 | 327, 35 | 336, 36 | 352, 37 | 354, 38 | 371, 39 | 374, 40 | 387, 41 | 409, 42 | 411, 43 | 412, 44 | 433, 45 | 436, 46 | 443, 47 | 466, 48 | 471, 49 | 508, 50 | 519, 51 | 526, 52 | 551, 53 | 557, 54 | 587, 55 | 590, 56 | 595, 57 | 603, 58 | 620, 59 | 635, 60 | 659, 61 | 682, 62 | 686, 63 | 694, 64 | 705, 65 | 720, 66 | 742, 67 | 765, 68 | 774, 69 | 778, 70 | 798, 71 | 800, 72 | 804, 73 | 824, 74 | 836, 75 | 840, 76 | 845, 77 | 871, 78 | 872, 79 | 874, 80 | 887, 81 | 897, 82 | 905, 83 | 907, 84 | 913, 85 | 925, 86 | 931, 87 | 937, 88 | 962, 89 | 963, 90 | 979, 91 | 983, 92 | 990, 93 | 991, 94 | 1022, 95 | 1029, 96 | 1037, 97 | 1042, 98 | 1050, 99 | 1059, 100 | 1079, 101 | 1085, 102 | 1087, 103 | 1098, 104 | 1101, 105 | 1123, 106 | 1129, 107 | 1132, 108 | 1142, 109 | 1153, 110 | 1162, 111 | 1174, 112 | 1176, 113 | 1177, 114 | 1181, 115 | 1185, 116 | 1197, 117 | 1205, 118 | 1214, 119 | 1234, 120 | 1236, 121 | 1240, 122 | 1245, 123 | 1250, 124 | 1251, 125 | 1257, 126 | 1265, 127 | 1272, 128 | 1279, 129 | 1312, 130 | 1320, 131 | 1331, 132 | 1342, 133 | 1346, 134 | 1351, 135 | 1367, 136 | 1376, 137 | 1387, 138 | 1399, 139 | 1417, 140 | 1425, 141 | 1437, 142 | 1441, 143 | 1443, 144 | 1448, 145 | 1455, 146 | 1457, 147 | 1473, 148 | 1480, 149 | 1488, 150 | 1494, 151 | 1495, 152 | 1503, 153 | 1504, 154 | 1506, 155 | 1507, 156 | 1520, 157 | 1524, 158 | 1529, 159 | 1534, 160 | 1542, 161 | 1549, 162 | 1564, 163 | 1579, 164 | 1604, 165 | 1607, 166 | 1617, 167 | 1621 168 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 5, 4 | 13, 5 | 35, 6 | 51, 7 | 53, 8 | 78, 9 | 88, 10 | 95, 11 | 98, 12 | 115, 13 | 117, 14 | 143, 15 | 144, 16 | 147, 17 | 151, 18 | 185, 19 | 195, 20 | 198, 21 | 202, 22 | 221, 23 | 224, 24 | 229, 25 | 230, 26 | 234, 27 | 236, 28 | 257, 29 | 286, 30 | 296, 31 | 305, 32 | 316, 33 | 326, 34 | 337, 35 | 341, 36 | 343, 37 | 363, 38 | 368, 39 | 373, 40 | 376, 41 | 377, 42 | 384, 43 | 415, 44 | 430, 45 | 447, 46 | 448, 47 | 452, 48 | 465, 49 | 470, 50 | 474, 51 | 488, 52 | 515, 53 | 518, 54 | 528, 55 | 531, 56 | 532, 57 | 541, 58 | 545, 59 | 559, 60 | 566, 61 | 567, 62 | 580, 63 | 588, 64 | 589, 65 | 598, 66 | 612, 67 | 622, 68 | 633, 69 | 642, 70 | 661, 71 | 662, 72 | 664, 73 | 695, 74 | 703, 75 | 706, 76 | 712, 77 | 717, 78 | 725, 79 | 740, 80 | 748, 81 | 750, 82 | 754, 83 | 755, 84 | 773, 85 | 803, 86 | 823, 87 | 825, 88 | 830, 89 | 834, 90 | 843, 91 | 852, 92 | 866, 93 | 867, 94 | 875, 95 | 880, 96 | 884, 97 | 886, 98 | 889, 99 | 961, 100 | 968, 101 | 970, 102 | 972, 103 | 978, 104 | 984, 105 | 1017, 106 | 1025, 107 | 1027, 108 | 1032, 109 | 1048, 110 | 1070, 111 | 1071, 112 | 1072, 113 | 1078, 114 | 1084, 115 | 1102, 116 | 1122, 117 | 1135, 118 | 1146, 119 | 1168, 120 | 1195, 121 | 1209, 122 | 1217, 123 | 1218, 124 | 1248, 125 | 1249, 126 | 1299, 127 | 1302, 128 | 1308, 129 | 1310, 130 | 1315, 131 | 1317, 132 | 1325, 133 | 1335, 134 | 1344, 135 | 1349, 136 | 1355, 137 | 1366, 138 | 1385, 139 | 1398, 140 | 1404, 141 | 1407, 142 | 1416, 143 | 1422, 144 | 1423, 145 | 1426, 146 | 1430, 147 | 1435, 148 | 1436, 149 | 1439, 150 | 1459, 151 | 1510, 152 | 1535, 153 | 1552, 154 | 1554, 155 | 1559, 156 | 1573, 157 | 1585, 158 | 1593, 159 | 1597, 160 | 1598, 161 | 1611, 162 | 1625, 163 | 1627 164 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/hackernews/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 19, 3 | 27, 4 | 28, 5 | 42, 6 | 57, 7 | 71, 8 | 81, 9 | 82, 10 | 101, 11 | 113, 12 | 118, 13 | 122, 14 | 125, 15 | 141, 16 | 148, 17 | 157, 18 | 164, 19 | 166, 20 | 171, 21 | 215, 22 | 222, 23 | 231, 24 | 233, 25 | 250, 26 | 258, 27 | 266, 28 | 280, 29 | 298, 30 | 333, 31 | 347, 32 | 357, 33 | 361, 34 | 404, 35 | 414, 36 | 424, 37 | 426, 38 | 431, 39 | 456, 40 | 462, 41 | 491, 42 | 517, 43 | 522, 44 | 524, 45 | 530, 46 | 542, 47 | 544, 48 | 568, 49 | 569, 50 | 577, 51 | 607, 52 | 618, 53 | 629, 54 | 641, 55 | 647, 56 | 651, 57 | 666, 58 | 668, 59 | 687, 60 | 690, 61 | 707, 62 | 710, 63 | 713, 64 | 715, 65 | 727, 66 | 733, 67 | 743, 68 | 745, 69 | 753, 70 | 757, 71 | 772, 72 | 779, 73 | 783, 74 | 787, 75 | 793, 76 | 799, 77 | 812, 78 | 828, 79 | 833, 80 | 877, 81 | 881, 82 | 883, 83 | 888, 84 | 892, 85 | 900, 86 | 915, 87 | 916, 88 | 929, 89 | 938, 90 | 942, 91 | 973, 92 | 977, 93 | 1001, 94 | 1019, 95 | 1020, 96 | 1038, 97 | 1047, 98 | 1060, 99 | 1063, 100 | 1064, 101 | 1075, 102 | 1077, 103 | 1106, 104 | 1109, 105 | 1115, 106 | 1116, 107 | 1117, 108 | 1136, 109 | 1139, 110 | 1143, 111 | 1151, 112 | 1154, 113 | 1155, 114 | 1156, 115 | 1180, 116 | 1183, 117 | 1193, 118 | 1206, 119 | 1216, 120 | 1223, 121 | 1243, 122 | 1255, 123 | 1281, 124 | 1284, 125 | 1286, 126 | 1301, 127 | 1309, 128 | 1365, 129 | 1370, 130 | 1371, 131 | 1373, 132 | 1375, 133 | 1379, 134 | 1383, 135 | 1405, 136 | 1421, 137 | 1431, 138 | 1445, 139 | 1456, 140 | 1461, 141 | 1463, 142 | 1464, 143 | 1466, 144 | 1474, 145 | 1477, 146 | 1498, 147 | 1500, 148 | 1518, 149 | 1523, 150 | 1531, 151 | 1533, 152 | 1566, 153 | 1576, 154 | 1577, 155 | 1586, 156 | 1619, 157 | 1626 158 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 17, 4 | 37, 5 | 60, 6 | 67, 7 | 86, 8 | 106, 9 | 111, 10 | 151, 11 | 177, 12 | 188, 13 | 194, 14 | 206, 15 | 220, 16 | 226, 17 | 240, 18 | 254, 19 | 256, 20 | 258, 21 | 259, 22 | 280, 23 | 287, 24 | 292, 25 | 298, 26 | 304, 27 | 319, 28 | 355, 29 | 366, 30 | 373, 31 | 381, 32 | 390, 33 | 395, 34 | 396, 35 | 413, 36 | 416, 37 | 419, 38 | 425, 39 | 434, 40 | 443, 41 | 495, 42 | 510, 43 | 530, 44 | 540, 45 | 555, 46 | 558, 47 | 585, 48 | 596, 49 | 598, 50 | 606, 51 | 613, 52 | 619, 53 | 627, 54 | 628, 55 | 638, 56 | 646, 57 | 651, 58 | 654, 59 | 676, 60 | 677, 61 | 680, 62 | 699, 63 | 704, 64 | 724, 65 | 738, 66 | 747, 67 | 757, 68 | 768, 69 | 769, 70 | 774, 71 | 776, 72 | 781, 73 | 783, 74 | 785, 75 | 811, 76 | 815, 77 | 832, 78 | 838, 79 | 857, 80 | 859, 81 | 866, 82 | 867, 83 | 908, 84 | 929, 85 | 932, 86 | 954, 87 | 955, 88 | 962, 89 | 966, 90 | 970, 91 | 974, 92 | 1008, 93 | 1011, 94 | 1013, 95 | 1015, 96 | 1031, 97 | 1051, 98 | 1067, 99 | 1072, 100 | 1075, 101 | 1077, 102 | 1082, 103 | 1083, 104 | 1103, 105 | 1119, 106 | 1122, 107 | 1133, 108 | 1140, 109 | 1147, 110 | 1152, 111 | 1158, 112 | 1159, 113 | 1165, 114 | 1168, 115 | 1171, 116 | 1174, 117 | 1176, 118 | 1184, 119 | 1186, 120 | 1204, 121 | 1212, 122 | 1219, 123 | 1228, 124 | 1253, 125 | 1269, 126 | 1271, 127 | 1277, 128 | 1284, 129 | 1292, 130 | 1299, 131 | 1314, 132 | 1337, 133 | 1363, 134 | 1379, 135 | 1389, 136 | 1393, 137 | 1395, 138 | 1422, 139 | 1423, 140 | 1425, 141 | 1448, 142 | 1449, 143 | 1454, 144 | 1463, 145 | 1468, 146 | 1477, 147 | 1481, 148 | 1490, 149 | 1506, 150 | 1529, 151 | 1530, 152 | 1534, 153 | 1537, 154 | 1549, 155 | 1554, 156 | 1557, 157 | 1568, 158 | 1608, 159 | 1618, 160 | 1619, 161 | 1621, 162 | 1625, 163 | 1638, 164 | 1645, 165 | 1659, 166 | 1662, 167 | 1666, 168 | 1669, 169 | 1683, 170 | 1686, 171 | 1698, 172 | 1711, 173 | 1714, 174 | 1716, 175 | 1723, 176 | 1728, 177 | 1743, 178 | 1747, 179 | 1752, 180 | 1754, 181 | 1765, 182 | 1774, 183 | 1787, 184 | 1797, 185 | 1800, 186 | 1821, 187 | 1822, 188 | 1832, 189 | 1838, 190 | 1869 191 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 13, 3 | 30, 4 | 31, 5 | 34, 6 | 40, 7 | 50, 8 | 51, 9 | 52, 10 | 55, 11 | 80, 12 | 108, 13 | 126, 14 | 128, 15 | 132, 16 | 133, 17 | 137, 18 | 138, 19 | 162, 20 | 180, 21 | 190, 22 | 191, 23 | 195, 24 | 199, 25 | 222, 26 | 233, 27 | 241, 28 | 245, 29 | 252, 30 | 267, 31 | 278, 32 | 281, 33 | 288, 34 | 291, 35 | 300, 36 | 317, 37 | 332, 38 | 333, 39 | 338, 40 | 345, 41 | 386, 42 | 397, 43 | 408, 44 | 409, 45 | 412, 46 | 422, 47 | 435, 48 | 442, 49 | 448, 50 | 455, 51 | 466, 52 | 472, 53 | 477, 54 | 484, 55 | 492, 56 | 519, 57 | 520, 58 | 521, 59 | 534, 60 | 538, 61 | 541, 62 | 569, 63 | 573, 64 | 575, 65 | 579, 66 | 581, 67 | 594, 68 | 656, 69 | 681, 70 | 695, 71 | 713, 72 | 720, 73 | 730, 74 | 741, 75 | 748, 76 | 751, 77 | 763, 78 | 772, 79 | 790, 80 | 798, 81 | 802, 82 | 809, 83 | 839, 84 | 864, 85 | 910, 86 | 914, 87 | 939, 88 | 949, 89 | 952, 90 | 957, 91 | 976, 92 | 989, 93 | 994, 94 | 995, 95 | 997, 96 | 998, 97 | 999, 98 | 1017, 99 | 1042, 100 | 1049, 101 | 1053, 102 | 1057, 103 | 1059, 104 | 1065, 105 | 1068, 106 | 1069, 107 | 1071, 108 | 1092, 109 | 1104, 110 | 1135, 111 | 1157, 112 | 1183, 113 | 1199, 114 | 1216, 115 | 1224, 116 | 1230, 117 | 1244, 118 | 1247, 119 | 1249, 120 | 1259, 121 | 1264, 122 | 1273, 123 | 1281, 124 | 1283, 125 | 1285, 126 | 1294, 127 | 1304, 128 | 1308, 129 | 1310, 130 | 1317, 131 | 1333, 132 | 1347, 133 | 1356, 134 | 1359, 135 | 1371, 136 | 1398, 137 | 1419, 138 | 1421, 139 | 1452, 140 | 1458, 141 | 1462, 142 | 1469, 143 | 1471, 144 | 1473, 145 | 1479, 146 | 1495, 147 | 1508, 148 | 1509, 149 | 1516, 150 | 1521, 151 | 1522, 152 | 1538, 153 | 1543, 154 | 1544, 155 | 1552, 156 | 1562, 157 | 1567, 158 | 1573, 159 | 1588, 160 | 1591, 161 | 1605, 162 | 1631, 163 | 1639, 164 | 1671, 165 | 1674, 166 | 1687, 167 | 1689, 168 | 1690, 169 | 1692, 170 | 1693, 171 | 1715, 172 | 1720, 173 | 1736, 174 | 1742, 175 | 1750, 176 | 1760, 177 | 1767, 178 | 1773, 179 | 1789, 180 | 1802, 181 | 1810, 182 | 1812, 183 | 1816, 184 | 1824, 185 | 1833, 186 | 1853, 187 | 1855, 188 | 1856, 189 | 1863, 190 | 1874 191 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 11, 4 | 39, 5 | 44, 6 | 49, 7 | 66, 8 | 78, 9 | 85, 10 | 87, 11 | 98, 12 | 105, 13 | 107, 14 | 112, 15 | 142, 16 | 147, 17 | 153, 18 | 160, 19 | 163, 20 | 170, 21 | 172, 22 | 174, 23 | 211, 24 | 213, 25 | 216, 26 | 217, 27 | 228, 28 | 235, 29 | 302, 30 | 306, 31 | 307, 32 | 308, 33 | 310, 34 | 323, 35 | 331, 36 | 342, 37 | 351, 38 | 359, 39 | 360, 40 | 362, 41 | 369, 42 | 379, 43 | 389, 44 | 391, 45 | 400, 46 | 403, 47 | 433, 48 | 438, 49 | 446, 50 | 451, 51 | 452, 52 | 469, 53 | 475, 54 | 476, 55 | 489, 56 | 493, 57 | 496, 58 | 498, 59 | 499, 60 | 506, 61 | 513, 62 | 516, 63 | 518, 64 | 522, 65 | 526, 66 | 532, 67 | 536, 68 | 576, 69 | 590, 70 | 591, 71 | 593, 72 | 645, 73 | 652, 74 | 655, 75 | 672, 76 | 690, 77 | 711, 78 | 722, 79 | 735, 80 | 736, 81 | 737, 82 | 746, 83 | 755, 84 | 759, 85 | 762, 86 | 765, 87 | 780, 88 | 792, 89 | 794, 90 | 841, 91 | 842, 92 | 868, 93 | 874, 94 | 879, 95 | 880, 96 | 896, 97 | 902, 98 | 923, 99 | 931, 100 | 934, 101 | 947, 102 | 958, 103 | 961, 104 | 993, 105 | 1005, 106 | 1007, 107 | 1022, 108 | 1025, 109 | 1028, 110 | 1038, 111 | 1052, 112 | 1055, 113 | 1061, 114 | 1090, 115 | 1098, 116 | 1118, 117 | 1127, 118 | 1141, 119 | 1143, 120 | 1149, 121 | 1164, 122 | 1189, 123 | 1193, 124 | 1194, 125 | 1200, 126 | 1201, 127 | 1210, 128 | 1217, 129 | 1233, 130 | 1242, 131 | 1248, 132 | 1280, 133 | 1297, 134 | 1305, 135 | 1322, 136 | 1323, 137 | 1338, 138 | 1345, 139 | 1346, 140 | 1350, 141 | 1367, 142 | 1373, 143 | 1376, 144 | 1396, 145 | 1404, 146 | 1411, 147 | 1412, 148 | 1416, 149 | 1426, 150 | 1432, 151 | 1455, 152 | 1461, 153 | 1470, 154 | 1474, 155 | 1482, 156 | 1489, 157 | 1507, 158 | 1511, 159 | 1541, 160 | 1550, 161 | 1560, 162 | 1571, 163 | 1580, 164 | 1606, 165 | 1610, 166 | 1613, 167 | 1617, 168 | 1623, 169 | 1626, 170 | 1627, 171 | 1632, 172 | 1646, 173 | 1667, 174 | 1675, 175 | 1676, 176 | 1695, 177 | 1699, 178 | 1703, 179 | 1763, 180 | 1780, 181 | 1808, 182 | 1814, 183 | 1815, 184 | 1830, 185 | 1842, 186 | 1857, 187 | 1865, 188 | 1866, 189 | 1873, 190 | 1883 191 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 9, 4 | 10, 5 | 12, 6 | 42, 7 | 47, 8 | 58, 9 | 71, 10 | 75, 11 | 83, 12 | 89, 13 | 96, 14 | 125, 15 | 130, 16 | 134, 17 | 140, 18 | 141, 19 | 144, 20 | 149, 21 | 169, 22 | 181, 23 | 187, 24 | 192, 25 | 196, 26 | 198, 27 | 210, 28 | 218, 29 | 237, 30 | 246, 31 | 248, 32 | 265, 33 | 271, 34 | 285, 35 | 286, 36 | 290, 37 | 311, 38 | 325, 39 | 335, 40 | 339, 41 | 347, 42 | 348, 43 | 364, 44 | 368, 45 | 375, 46 | 376, 47 | 382, 48 | 384, 49 | 385, 50 | 388, 51 | 399, 52 | 410, 53 | 411, 54 | 420, 55 | 426, 56 | 450, 57 | 457, 58 | 460, 59 | 461, 60 | 465, 61 | 479, 62 | 486, 63 | 504, 64 | 508, 65 | 545, 66 | 548, 67 | 551, 68 | 553, 69 | 603, 70 | 609, 71 | 621, 72 | 630, 73 | 637, 74 | 659, 75 | 662, 76 | 664, 77 | 682, 78 | 684, 79 | 689, 80 | 697, 81 | 714, 82 | 716, 83 | 719, 84 | 723, 85 | 729, 86 | 758, 87 | 777, 88 | 784, 89 | 803, 90 | 810, 91 | 821, 92 | 822, 93 | 824, 94 | 827, 95 | 847, 96 | 849, 97 | 869, 98 | 883, 99 | 888, 100 | 889, 101 | 898, 102 | 907, 103 | 911, 104 | 920, 105 | 933, 106 | 938, 107 | 943, 108 | 953, 109 | 956, 110 | 965, 111 | 978, 112 | 979, 113 | 986, 114 | 1001, 115 | 1026, 116 | 1036, 117 | 1040, 118 | 1084, 119 | 1091, 120 | 1106, 121 | 1108, 122 | 1110, 123 | 1128, 124 | 1136, 125 | 1144, 126 | 1146, 127 | 1156, 128 | 1167, 129 | 1172, 130 | 1175, 131 | 1181, 132 | 1185, 133 | 1197, 134 | 1198, 135 | 1202, 136 | 1208, 137 | 1211, 138 | 1218, 139 | 1225, 140 | 1232, 141 | 1237, 142 | 1265, 143 | 1278, 144 | 1289, 145 | 1291, 146 | 1295, 147 | 1298, 148 | 1320, 149 | 1326, 150 | 1341, 151 | 1351, 152 | 1362, 153 | 1385, 154 | 1390, 155 | 1409, 156 | 1414, 157 | 1415, 158 | 1424, 159 | 1427, 160 | 1434, 161 | 1441, 162 | 1444, 163 | 1487, 164 | 1488, 165 | 1505, 166 | 1524, 167 | 1535, 168 | 1581, 169 | 1604, 170 | 1611, 171 | 1612, 172 | 1634, 173 | 1641, 174 | 1651, 175 | 1664, 176 | 1718, 177 | 1722, 178 | 1733, 179 | 1738, 180 | 1762, 181 | 1764, 182 | 1772, 183 | 1804, 184 | 1818, 185 | 1823, 186 | 1839, 187 | 1848, 188 | 1858, 189 | 1870, 190 | 1879 191 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 19, 4 | 26, 5 | 56, 6 | 59, 7 | 64, 8 | 70, 9 | 76, 10 | 79, 11 | 88, 12 | 97, 13 | 110, 14 | 113, 15 | 129, 16 | 139, 17 | 148, 18 | 157, 19 | 168, 20 | 178, 21 | 193, 22 | 204, 23 | 208, 24 | 225, 25 | 227, 26 | 236, 27 | 239, 28 | 243, 29 | 249, 30 | 266, 31 | 268, 32 | 270, 33 | 275, 34 | 277, 35 | 283, 36 | 299, 37 | 303, 38 | 316, 39 | 327, 40 | 330, 41 | 365, 42 | 387, 43 | 407, 44 | 414, 45 | 445, 46 | 468, 47 | 478, 48 | 480, 49 | 483, 50 | 502, 51 | 514, 52 | 527, 53 | 542, 54 | 554, 55 | 556, 56 | 561, 57 | 563, 58 | 566, 59 | 571, 60 | 572, 61 | 578, 62 | 602, 63 | 604, 64 | 612, 65 | 626, 66 | 640, 67 | 657, 68 | 658, 69 | 661, 70 | 663, 71 | 674, 72 | 679, 73 | 685, 74 | 687, 75 | 696, 76 | 700, 77 | 728, 78 | 742, 79 | 756, 80 | 787, 81 | 791, 82 | 801, 83 | 819, 84 | 820, 85 | 826, 86 | 830, 87 | 848, 88 | 851, 89 | 860, 90 | 862, 91 | 863, 92 | 877, 93 | 885, 94 | 890, 95 | 895, 96 | 897, 97 | 899, 98 | 906, 99 | 909, 100 | 918, 101 | 922, 102 | 926, 103 | 927, 104 | 944, 105 | 960, 106 | 969, 107 | 988, 108 | 996, 109 | 1010, 110 | 1018, 111 | 1029, 112 | 1030, 113 | 1056, 114 | 1058, 115 | 1062, 116 | 1073, 117 | 1076, 118 | 1081, 119 | 1085, 120 | 1095, 121 | 1105, 122 | 1112, 123 | 1126, 124 | 1145, 125 | 1150, 126 | 1153, 127 | 1166, 128 | 1190, 129 | 1195, 130 | 1223, 131 | 1229, 132 | 1231, 133 | 1266, 134 | 1274, 135 | 1275, 136 | 1288, 137 | 1303, 138 | 1307, 139 | 1309, 140 | 1319, 141 | 1327, 142 | 1331, 143 | 1339, 144 | 1357, 145 | 1358, 146 | 1366, 147 | 1377, 148 | 1383, 149 | 1391, 150 | 1397, 151 | 1399, 152 | 1400, 153 | 1403, 154 | 1407, 155 | 1429, 156 | 1435, 157 | 1460, 158 | 1466, 159 | 1493, 160 | 1499, 161 | 1518, 162 | 1525, 163 | 1532, 164 | 1542, 165 | 1545, 166 | 1569, 167 | 1576, 168 | 1579, 169 | 1582, 170 | 1583, 171 | 1584, 172 | 1589, 173 | 1595, 174 | 1596, 175 | 1630, 176 | 1647, 177 | 1648, 178 | 1649, 179 | 1668, 180 | 1670, 181 | 1682, 182 | 1702, 183 | 1712, 184 | 1730, 185 | 1735, 186 | 1759, 187 | 1782, 188 | 1798, 189 | 1835, 190 | 1859 191 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 14, 3 | 21, 4 | 22, 5 | 27, 6 | 29, 7 | 57, 8 | 72, 9 | 73, 10 | 74, 11 | 93, 12 | 109, 13 | 120, 14 | 136, 15 | 143, 16 | 152, 17 | 156, 18 | 167, 19 | 171, 20 | 175, 21 | 176, 22 | 179, 23 | 184, 24 | 200, 25 | 205, 26 | 219, 27 | 229, 28 | 273, 29 | 274, 30 | 282, 31 | 289, 32 | 322, 33 | 326, 34 | 358, 35 | 367, 36 | 374, 37 | 393, 38 | 415, 39 | 417, 40 | 423, 41 | 428, 42 | 429, 43 | 437, 44 | 449, 45 | 458, 46 | 459, 47 | 471, 48 | 473, 49 | 487, 50 | 488, 51 | 491, 52 | 505, 53 | 507, 54 | 517, 55 | 529, 56 | 539, 57 | 565, 58 | 588, 59 | 592, 60 | 601, 61 | 614, 62 | 617, 63 | 622, 64 | 669, 65 | 670, 66 | 709, 67 | 732, 68 | 752, 69 | 753, 70 | 788, 71 | 797, 72 | 814, 73 | 818, 74 | 823, 75 | 833, 76 | 837, 77 | 843, 78 | 845, 79 | 850, 80 | 872, 81 | 873, 82 | 884, 83 | 903, 84 | 917, 85 | 924, 86 | 937, 87 | 959, 88 | 975, 89 | 984, 90 | 991, 91 | 1002, 92 | 1009, 93 | 1041, 94 | 1044, 95 | 1045, 96 | 1047, 97 | 1064, 98 | 1074, 99 | 1107, 100 | 1114, 101 | 1117, 102 | 1125, 103 | 1132, 104 | 1134, 105 | 1148, 106 | 1160, 107 | 1161, 108 | 1191, 109 | 1207, 110 | 1220, 111 | 1222, 112 | 1272, 113 | 1286, 114 | 1293, 115 | 1301, 116 | 1306, 117 | 1313, 118 | 1315, 119 | 1316, 120 | 1321, 121 | 1343, 122 | 1408, 123 | 1413, 124 | 1417, 125 | 1418, 126 | 1420, 127 | 1430, 128 | 1437, 129 | 1440, 130 | 1445, 131 | 1465, 132 | 1467, 133 | 1475, 134 | 1478, 135 | 1484, 136 | 1486, 137 | 1491, 138 | 1492, 139 | 1503, 140 | 1513, 141 | 1514, 142 | 1533, 143 | 1539, 144 | 1540, 145 | 1547, 146 | 1551, 147 | 1555, 148 | 1556, 149 | 1559, 150 | 1572, 151 | 1590, 152 | 1594, 153 | 1597, 154 | 1600, 155 | 1607, 156 | 1622, 157 | 1629, 158 | 1633, 159 | 1637, 160 | 1650, 161 | 1653, 162 | 1655, 163 | 1656, 164 | 1658, 165 | 1673, 166 | 1678, 167 | 1680, 168 | 1684, 169 | 1696, 170 | 1700, 171 | 1705, 172 | 1708, 173 | 1709, 174 | 1726, 175 | 1741, 176 | 1749, 177 | 1751, 178 | 1771, 179 | 1784, 180 | 1786, 181 | 1791, 182 | 1794, 183 | 1796, 184 | 1799, 185 | 1834, 186 | 1845, 187 | 1867, 188 | 1875, 189 | 1877 190 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 8, 4 | 23, 5 | 32, 6 | 38, 7 | 53, 8 | 54, 9 | 62, 10 | 82, 11 | 84, 12 | 90, 13 | 92, 14 | 94, 15 | 95, 16 | 115, 17 | 131, 18 | 145, 19 | 155, 20 | 161, 21 | 173, 22 | 182, 23 | 185, 24 | 197, 25 | 201, 26 | 207, 27 | 215, 28 | 230, 29 | 231, 30 | 234, 31 | 238, 32 | 251, 33 | 253, 34 | 262, 35 | 263, 36 | 276, 37 | 295, 38 | 297, 39 | 312, 40 | 315, 41 | 329, 42 | 343, 43 | 352, 44 | 361, 45 | 378, 46 | 394, 47 | 418, 48 | 421, 49 | 440, 50 | 441, 51 | 467, 52 | 503, 53 | 528, 54 | 567, 55 | 600, 56 | 618, 57 | 623, 58 | 625, 59 | 631, 60 | 634, 61 | 660, 62 | 673, 63 | 686, 64 | 688, 65 | 701, 66 | 702, 67 | 706, 68 | 707, 69 | 708, 70 | 710, 71 | 712, 72 | 717, 73 | 718, 74 | 726, 75 | 740, 76 | 745, 77 | 760, 78 | 764, 79 | 766, 80 | 775, 81 | 782, 82 | 807, 83 | 852, 84 | 853, 85 | 854, 86 | 855, 87 | 875, 88 | 901, 89 | 904, 90 | 915, 91 | 921, 92 | 935, 93 | 940, 94 | 951, 95 | 963, 96 | 964, 97 | 972, 98 | 980, 99 | 985, 100 | 1003, 101 | 1016, 102 | 1024, 103 | 1034, 104 | 1066, 105 | 1088, 106 | 1089, 107 | 1099, 108 | 1102, 109 | 1113, 110 | 1121, 111 | 1129, 112 | 1142, 113 | 1154, 114 | 1162, 115 | 1188, 116 | 1192, 117 | 1203, 118 | 1205, 119 | 1234, 120 | 1243, 121 | 1245, 122 | 1252, 123 | 1256, 124 | 1257, 125 | 1260, 126 | 1267, 127 | 1276, 128 | 1282, 129 | 1312, 130 | 1330, 131 | 1332, 132 | 1344, 133 | 1348, 134 | 1349, 135 | 1365, 136 | 1370, 137 | 1372, 138 | 1375, 139 | 1384, 140 | 1392, 141 | 1402, 142 | 1405, 143 | 1436, 144 | 1446, 145 | 1451, 146 | 1456, 147 | 1476, 148 | 1480, 149 | 1494, 150 | 1519, 151 | 1548, 152 | 1558, 153 | 1574, 154 | 1575, 155 | 1577, 156 | 1586, 157 | 1592, 158 | 1593, 159 | 1598, 160 | 1616, 161 | 1620, 162 | 1636, 163 | 1642, 164 | 1643, 165 | 1654, 166 | 1665, 167 | 1672, 168 | 1681, 169 | 1691, 170 | 1706, 171 | 1717, 172 | 1727, 173 | 1740, 174 | 1757, 175 | 1775, 176 | 1779, 177 | 1785, 178 | 1793, 179 | 1807, 180 | 1825, 181 | 1831, 182 | 1840, 183 | 1844, 184 | 1846, 185 | 1851, 186 | 1861, 187 | 1862, 188 | 1876, 189 | 1878 190 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 4, 4 | 15, 5 | 16, 6 | 18, 7 | 20, 8 | 25, 9 | 28, 10 | 36, 11 | 63, 12 | 91, 13 | 118, 14 | 119, 15 | 122, 16 | 123, 17 | 127, 18 | 135, 19 | 146, 20 | 154, 21 | 158, 22 | 183, 23 | 212, 24 | 221, 25 | 242, 26 | 247, 27 | 257, 28 | 261, 29 | 269, 30 | 284, 31 | 293, 32 | 301, 33 | 309, 34 | 318, 35 | 336, 36 | 340, 37 | 350, 38 | 353, 39 | 354, 40 | 356, 41 | 357, 42 | 363, 43 | 371, 44 | 398, 45 | 404, 46 | 405, 47 | 406, 48 | 424, 49 | 430, 50 | 431, 51 | 447, 52 | 454, 53 | 462, 54 | 490, 55 | 500, 56 | 525, 57 | 549, 58 | 560, 59 | 568, 60 | 584, 61 | 589, 62 | 610, 63 | 615, 64 | 629, 65 | 632, 66 | 633, 67 | 635, 68 | 636, 69 | 641, 70 | 643, 71 | 671, 72 | 675, 73 | 692, 74 | 694, 75 | 703, 76 | 705, 77 | 725, 78 | 727, 79 | 731, 80 | 750, 81 | 754, 82 | 778, 83 | 786, 84 | 793, 85 | 799, 86 | 805, 87 | 806, 88 | 836, 89 | 840, 90 | 858, 91 | 919, 92 | 925, 93 | 930, 94 | 948, 95 | 971, 96 | 973, 97 | 981, 98 | 983, 99 | 987, 100 | 990, 101 | 992, 102 | 1006, 103 | 1021, 104 | 1032, 105 | 1048, 106 | 1080, 107 | 1087, 108 | 1093, 109 | 1094, 110 | 1096, 111 | 1097, 112 | 1109, 113 | 1111, 114 | 1116, 115 | 1123, 116 | 1124, 117 | 1131, 118 | 1138, 119 | 1169, 120 | 1170, 121 | 1173, 122 | 1177, 123 | 1178, 124 | 1179, 125 | 1180, 126 | 1182, 127 | 1187, 128 | 1196, 129 | 1214, 130 | 1215, 131 | 1226, 132 | 1236, 133 | 1238, 134 | 1239, 135 | 1255, 136 | 1258, 137 | 1268, 138 | 1270, 139 | 1302, 140 | 1334, 141 | 1336, 142 | 1340, 143 | 1354, 144 | 1355, 145 | 1394, 146 | 1406, 147 | 1442, 148 | 1457, 149 | 1459, 150 | 1502, 151 | 1504, 152 | 1510, 153 | 1520, 154 | 1523, 155 | 1526, 156 | 1546, 157 | 1578, 158 | 1587, 159 | 1602, 160 | 1603, 161 | 1615, 162 | 1635, 163 | 1661, 164 | 1688, 165 | 1701, 166 | 1704, 167 | 1707, 168 | 1719, 169 | 1721, 170 | 1725, 171 | 1729, 172 | 1731, 173 | 1734, 174 | 1739, 175 | 1745, 176 | 1748, 177 | 1756, 178 | 1769, 179 | 1776, 180 | 1790, 181 | 1792, 182 | 1827, 183 | 1836, 184 | 1843, 185 | 1852, 186 | 1868, 187 | 1872, 188 | 1880, 189 | 1882 190 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 24, 3 | 45, 4 | 61, 5 | 68, 6 | 77, 7 | 99, 8 | 100, 9 | 101, 10 | 102, 11 | 103, 12 | 104, 13 | 114, 14 | 117, 15 | 124, 16 | 164, 17 | 165, 18 | 166, 19 | 209, 20 | 214, 21 | 224, 22 | 244, 23 | 255, 24 | 260, 25 | 279, 26 | 294, 27 | 296, 28 | 313, 29 | 321, 30 | 334, 31 | 337, 32 | 344, 33 | 346, 34 | 377, 35 | 383, 36 | 401, 37 | 436, 38 | 439, 39 | 453, 40 | 463, 41 | 464, 42 | 474, 43 | 481, 44 | 485, 45 | 494, 46 | 509, 47 | 512, 48 | 524, 49 | 531, 50 | 533, 51 | 535, 52 | 537, 53 | 543, 54 | 550, 55 | 552, 56 | 557, 57 | 562, 58 | 580, 59 | 586, 60 | 587, 61 | 595, 62 | 599, 63 | 605, 64 | 607, 65 | 642, 66 | 644, 67 | 647, 68 | 649, 69 | 653, 70 | 665, 71 | 667, 72 | 668, 73 | 683, 74 | 691, 75 | 721, 76 | 733, 77 | 743, 78 | 761, 79 | 770, 80 | 771, 81 | 789, 82 | 808, 83 | 816, 84 | 817, 85 | 825, 86 | 828, 87 | 831, 88 | 856, 89 | 865, 90 | 870, 91 | 876, 92 | 878, 93 | 887, 94 | 893, 95 | 894, 96 | 905, 97 | 941, 98 | 945, 99 | 977, 100 | 982, 101 | 1000, 102 | 1012, 103 | 1020, 104 | 1027, 105 | 1035, 106 | 1037, 107 | 1039, 108 | 1043, 109 | 1046, 110 | 1050, 111 | 1086, 112 | 1101, 113 | 1120, 114 | 1130, 115 | 1151, 116 | 1213, 117 | 1221, 118 | 1240, 119 | 1246, 120 | 1251, 121 | 1254, 122 | 1262, 123 | 1279, 124 | 1296, 125 | 1300, 126 | 1311, 127 | 1318, 128 | 1324, 129 | 1328, 130 | 1329, 131 | 1335, 132 | 1342, 133 | 1360, 134 | 1361, 135 | 1378, 136 | 1380, 137 | 1386, 138 | 1387, 139 | 1410, 140 | 1428, 141 | 1431, 142 | 1433, 143 | 1438, 144 | 1439, 145 | 1443, 146 | 1447, 147 | 1453, 148 | 1464, 149 | 1483, 150 | 1497, 151 | 1531, 152 | 1536, 153 | 1561, 154 | 1564, 155 | 1570, 156 | 1585, 157 | 1601, 158 | 1609, 159 | 1628, 160 | 1640, 161 | 1644, 162 | 1652, 163 | 1660, 164 | 1679, 165 | 1685, 166 | 1697, 167 | 1710, 168 | 1724, 169 | 1746, 170 | 1753, 171 | 1758, 172 | 1761, 173 | 1768, 174 | 1781, 175 | 1783, 176 | 1788, 177 | 1795, 178 | 1803, 179 | 1806, 180 | 1811, 181 | 1813, 182 | 1817, 183 | 1820, 184 | 1837, 185 | 1854, 186 | 1860, 187 | 1864, 188 | 1871, 189 | 1881 190 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/nih-exporter/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 7, 3 | 33, 4 | 35, 5 | 41, 6 | 43, 7 | 46, 8 | 48, 9 | 65, 10 | 69, 11 | 81, 12 | 116, 13 | 121, 14 | 150, 15 | 159, 16 | 186, 17 | 189, 18 | 202, 19 | 203, 20 | 223, 21 | 232, 22 | 250, 23 | 264, 24 | 272, 25 | 305, 26 | 314, 27 | 320, 28 | 324, 29 | 328, 30 | 341, 31 | 349, 32 | 370, 33 | 372, 34 | 380, 35 | 392, 36 | 402, 37 | 427, 38 | 432, 39 | 444, 40 | 456, 41 | 470, 42 | 482, 43 | 497, 44 | 501, 45 | 511, 46 | 515, 47 | 523, 48 | 544, 49 | 546, 50 | 547, 51 | 559, 52 | 564, 53 | 570, 54 | 574, 55 | 577, 56 | 582, 57 | 583, 58 | 597, 59 | 608, 60 | 611, 61 | 616, 62 | 620, 63 | 624, 64 | 639, 65 | 648, 66 | 650, 67 | 666, 68 | 678, 69 | 693, 70 | 698, 71 | 715, 72 | 734, 73 | 739, 74 | 744, 75 | 749, 76 | 767, 77 | 773, 78 | 779, 79 | 795, 80 | 796, 81 | 800, 82 | 804, 83 | 812, 84 | 813, 85 | 829, 86 | 834, 87 | 835, 88 | 844, 89 | 846, 90 | 861, 91 | 871, 92 | 881, 93 | 882, 94 | 886, 95 | 891, 96 | 892, 97 | 900, 98 | 912, 99 | 913, 100 | 916, 101 | 928, 102 | 936, 103 | 942, 104 | 946, 105 | 950, 106 | 967, 107 | 968, 108 | 1004, 109 | 1014, 110 | 1019, 111 | 1023, 112 | 1033, 113 | 1054, 114 | 1060, 115 | 1063, 116 | 1070, 117 | 1078, 118 | 1079, 119 | 1100, 120 | 1115, 121 | 1137, 122 | 1139, 123 | 1155, 124 | 1163, 125 | 1206, 126 | 1209, 127 | 1227, 128 | 1235, 129 | 1241, 130 | 1250, 131 | 1261, 132 | 1263, 133 | 1287, 134 | 1290, 135 | 1325, 136 | 1352, 137 | 1353, 138 | 1364, 139 | 1368, 140 | 1369, 141 | 1374, 142 | 1381, 143 | 1382, 144 | 1388, 145 | 1401, 146 | 1450, 147 | 1472, 148 | 1485, 149 | 1496, 150 | 1498, 151 | 1500, 152 | 1501, 153 | 1512, 154 | 1515, 155 | 1517, 156 | 1527, 157 | 1528, 158 | 1553, 159 | 1563, 160 | 1565, 161 | 1566, 162 | 1599, 163 | 1614, 164 | 1624, 165 | 1657, 166 | 1663, 167 | 1677, 168 | 1694, 169 | 1713, 170 | 1732, 171 | 1737, 172 | 1744, 173 | 1755, 174 | 1766, 175 | 1770, 176 | 1777, 177 | 1778, 178 | 1801, 179 | 1805, 180 | 1809, 181 | 1819, 182 | 1826, 183 | 1828, 184 | 1829, 185 | 1841, 186 | 1847, 187 | 1849, 188 | 1850 189 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 4, 4 | 6, 5 | 8, 6 | 11, 7 | 13, 8 | 19, 9 | 21, 10 | 40, 11 | 48, 12 | 50, 13 | 56, 14 | 62, 15 | 65, 16 | 118, 17 | 119, 18 | 126, 19 | 145, 20 | 153, 21 | 155, 22 | 167, 23 | 171, 24 | 184, 25 | 188, 26 | 213, 27 | 224, 28 | 244, 29 | 259, 30 | 268, 31 | 308, 32 | 312, 33 | 315, 34 | 325, 35 | 339, 36 | 393, 37 | 394, 38 | 397, 39 | 411, 40 | 427, 41 | 436, 42 | 439, 43 | 447, 44 | 450, 45 | 457, 46 | 461, 47 | 466, 48 | 490, 49 | 492, 50 | 494, 51 | 498, 52 | 507, 53 | 508, 54 | 514, 55 | 519, 56 | 523, 57 | 532, 58 | 542, 59 | 544, 60 | 551, 61 | 572, 62 | 573, 63 | 623, 64 | 634, 65 | 636 66 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 43, 3 | 54, 4 | 55, 5 | 72, 6 | 73, 7 | 74, 8 | 83, 9 | 89, 10 | 94, 11 | 98, 12 | 109, 13 | 114, 14 | 127, 15 | 136, 16 | 142, 17 | 146, 18 | 157, 19 | 163, 20 | 164, 21 | 169, 22 | 202, 23 | 219, 24 | 220, 25 | 231, 26 | 234, 27 | 237, 28 | 246, 29 | 247, 30 | 250, 31 | 251, 32 | 266, 33 | 276, 34 | 289, 35 | 292, 36 | 304, 37 | 329, 38 | 336, 39 | 363, 40 | 367, 41 | 369, 42 | 371, 43 | 374, 44 | 375, 45 | 414, 46 | 425, 47 | 449, 48 | 453, 49 | 474, 50 | 481, 51 | 500, 52 | 505, 53 | 515, 54 | 530, 55 | 540, 56 | 545, 57 | 552, 58 | 574, 59 | 584, 60 | 596, 61 | 598, 62 | 602, 63 | 629 64 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 5, 3 | 33, 4 | 66, 5 | 80, 6 | 99, 7 | 107, 8 | 110, 9 | 116, 10 | 120, 11 | 125, 12 | 128, 13 | 133, 14 | 138, 15 | 149, 16 | 161, 17 | 168, 18 | 176, 19 | 182, 20 | 193, 21 | 204, 22 | 226, 23 | 248, 24 | 253, 25 | 256, 26 | 272, 27 | 273, 28 | 277, 29 | 286, 30 | 297, 31 | 301, 32 | 303, 33 | 305, 34 | 310, 35 | 321, 36 | 348, 37 | 349, 38 | 350, 39 | 358, 40 | 372, 41 | 387, 42 | 403, 43 | 417, 44 | 418, 45 | 428, 46 | 443, 47 | 462, 48 | 502, 49 | 503, 50 | 512, 51 | 531, 52 | 537, 53 | 539, 54 | 541, 55 | 560, 56 | 568, 57 | 569, 58 | 575, 59 | 583, 60 | 585, 61 | 586, 62 | 593, 63 | 597, 64 | 603, 65 | 611, 66 | 612, 67 | 617, 68 | 631 69 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 15, 4 | 17, 5 | 23, 6 | 25, 7 | 28, 8 | 29, 9 | 34, 10 | 38, 11 | 52, 12 | 58, 13 | 60, 14 | 71, 15 | 77, 16 | 104, 17 | 115, 18 | 129, 19 | 131, 20 | 135, 21 | 150, 22 | 199, 23 | 221, 24 | 222, 25 | 227, 26 | 233, 27 | 242, 28 | 243, 29 | 260, 30 | 274, 31 | 284, 32 | 288, 33 | 291, 34 | 298, 35 | 302, 36 | 307, 37 | 327, 38 | 334, 39 | 352, 40 | 354, 41 | 355, 42 | 359, 43 | 368, 44 | 376, 45 | 378, 46 | 381, 47 | 382, 48 | 384, 49 | 389, 50 | 390, 51 | 395, 52 | 416, 53 | 421, 54 | 423, 55 | 432, 56 | 444, 57 | 448, 58 | 460, 59 | 463, 60 | 468, 61 | 469, 62 | 493, 63 | 495, 64 | 556, 65 | 563, 66 | 567, 67 | 577, 68 | 580, 69 | 589, 70 | 591, 71 | 605, 72 | 607, 73 | 608, 74 | 619, 75 | 633 76 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 14, 4 | 30, 5 | 37, 6 | 57, 7 | 64, 8 | 67, 9 | 79, 10 | 82, 11 | 85, 12 | 87, 13 | 91, 14 | 103, 15 | 111, 16 | 141, 17 | 144, 18 | 152, 19 | 174, 20 | 175, 21 | 179, 22 | 197, 23 | 200, 24 | 205, 25 | 207, 26 | 216, 27 | 232, 28 | 238, 29 | 265, 30 | 296, 31 | 306, 32 | 335, 33 | 337, 34 | 341, 35 | 343, 36 | 347, 37 | 353, 38 | 357, 39 | 366, 40 | 379, 41 | 380, 42 | 392, 43 | 400, 44 | 402, 45 | 422, 46 | 434, 47 | 435, 48 | 456, 49 | 458, 50 | 471, 51 | 489, 52 | 506, 53 | 509, 54 | 513, 55 | 550, 56 | 553, 57 | 557, 58 | 559, 59 | 565, 60 | 595, 61 | 615, 62 | 616, 63 | 635, 64 | 637 65 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 10, 3 | 18, 4 | 22, 5 | 31, 6 | 36, 7 | 47, 8 | 68, 9 | 69, 10 | 84, 11 | 90, 12 | 97, 13 | 105, 14 | 112, 15 | 113, 16 | 117, 17 | 130, 18 | 147, 19 | 159, 20 | 160, 21 | 166, 22 | 178, 23 | 180, 24 | 185, 25 | 189, 26 | 190, 27 | 210, 28 | 215, 29 | 217, 30 | 223, 31 | 229, 32 | 230, 33 | 236, 34 | 255, 35 | 269, 36 | 313, 37 | 316, 38 | 328, 39 | 333, 40 | 345, 41 | 356, 42 | 364, 43 | 365, 44 | 377, 45 | 385, 46 | 398, 47 | 399, 48 | 412, 49 | 413, 50 | 441, 51 | 445, 52 | 446, 53 | 476, 54 | 479, 55 | 510, 56 | 520, 57 | 548, 58 | 555, 59 | 576, 60 | 579, 61 | 587, 62 | 592, 63 | 594, 64 | 606, 65 | 613, 66 | 622, 67 | 625, 68 | 626, 69 | 632, 70 | 640 71 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 7, 4 | 12, 5 | 16, 6 | 20, 7 | 35, 8 | 76, 9 | 88, 10 | 92, 11 | 102, 12 | 108, 13 | 123, 14 | 137, 15 | 148, 16 | 170, 17 | 177, 18 | 195, 19 | 196, 20 | 203, 21 | 208, 22 | 211, 23 | 214, 24 | 241, 25 | 245, 26 | 254, 27 | 280, 28 | 281, 29 | 283, 30 | 285, 31 | 293, 32 | 295, 33 | 309, 34 | 311, 35 | 338, 36 | 342, 37 | 370, 38 | 391, 39 | 431, 40 | 442, 41 | 452, 42 | 465, 43 | 473, 44 | 511, 45 | 528, 46 | 533, 47 | 534, 48 | 549, 49 | 558, 50 | 561, 51 | 571, 52 | 581, 53 | 588, 54 | 610, 55 | 620, 56 | 641 57 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 9, 3 | 39, 4 | 45, 5 | 49, 6 | 51, 7 | 53, 8 | 70, 9 | 75, 10 | 106, 11 | 121, 12 | 134, 13 | 140, 14 | 151, 15 | 158, 16 | 172, 17 | 181, 18 | 183, 19 | 187, 20 | 194, 21 | 201, 22 | 209, 23 | 225, 24 | 264, 25 | 270, 26 | 278, 27 | 290, 28 | 317, 29 | 318, 30 | 326, 31 | 344, 32 | 351, 33 | 383, 34 | 388, 35 | 396, 36 | 408, 37 | 410, 38 | 415, 39 | 419, 40 | 420, 41 | 455, 42 | 464, 43 | 484, 44 | 488, 45 | 491, 46 | 496, 47 | 501, 48 | 517, 49 | 521, 50 | 522, 51 | 524, 52 | 525, 53 | 538, 54 | 562, 55 | 582, 56 | 600, 57 | 601, 58 | 604, 59 | 614, 60 | 638 61 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 27, 3 | 42, 4 | 46, 5 | 61, 6 | 78, 7 | 86, 8 | 93, 9 | 95, 10 | 96, 11 | 139, 12 | 186, 13 | 191, 14 | 198, 15 | 206, 16 | 212, 17 | 218, 18 | 235, 19 | 252, 20 | 258, 21 | 261, 22 | 294, 23 | 314, 24 | 320, 25 | 322, 26 | 323, 27 | 330, 28 | 331, 29 | 340, 30 | 346, 31 | 360, 32 | 386, 33 | 404, 34 | 405, 35 | 406, 36 | 424, 37 | 426, 38 | 429, 39 | 430, 40 | 433, 41 | 437, 42 | 440, 43 | 454, 44 | 467, 45 | 470, 46 | 472, 47 | 475, 48 | 477, 49 | 478, 50 | 482, 51 | 483, 52 | 485, 53 | 487, 54 | 497, 55 | 504, 56 | 516, 57 | 518, 58 | 526, 59 | 527, 60 | 529, 61 | 535, 62 | 546, 63 | 554, 64 | 564, 65 | 566, 66 | 578, 67 | 590, 68 | 609, 69 | 621, 70 | 624, 71 | 630, 72 | 639 73 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/opensubtitles/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 24, 3 | 26, 4 | 32, 5 | 41, 6 | 44, 7 | 59, 8 | 63, 9 | 81, 10 | 100, 11 | 101, 12 | 122, 13 | 124, 14 | 132, 15 | 143, 16 | 154, 17 | 156, 18 | 162, 19 | 165, 20 | 173, 21 | 192, 22 | 228, 23 | 239, 24 | 240, 25 | 249, 26 | 257, 27 | 262, 28 | 263, 29 | 267, 30 | 271, 31 | 275, 32 | 279, 33 | 282, 34 | 287, 35 | 299, 36 | 300, 37 | 319, 38 | 324, 39 | 332, 40 | 361, 41 | 362, 42 | 373, 43 | 401, 44 | 407, 45 | 409, 46 | 438, 47 | 451, 48 | 459, 49 | 480, 50 | 486, 51 | 499, 52 | 536, 53 | 543, 54 | 547, 55 | 570, 56 | 599, 57 | 618, 58 | 627, 59 | 628 60 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group0.json: -------------------------------------------------------------------------------- 1 | [ 2 | 2, 3 | 4, 4 | 20, 5 | 30, 6 | 57, 7 | 61, 8 | 66, 9 | 79, 10 | 82, 11 | 94, 12 | 126, 13 | 142, 14 | 150, 15 | 155, 16 | 157, 17 | 164, 18 | 167, 19 | 169, 20 | 175, 21 | 198, 22 | 205, 23 | 206, 24 | 222, 25 | 233, 26 | 248, 27 | 249, 28 | 252, 29 | 282, 30 | 294, 31 | 302, 32 | 310, 33 | 316, 34 | 322, 35 | 323 36 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group1.json: -------------------------------------------------------------------------------- 1 | [ 2 | 19, 3 | 41, 4 | 45, 5 | 52, 6 | 64, 7 | 74, 8 | 75, 9 | 80, 10 | 83, 11 | 89, 12 | 91, 13 | 97, 14 | 112, 15 | 130, 16 | 131, 17 | 134, 18 | 141, 19 | 143, 20 | 147, 21 | 180, 22 | 201, 23 | 203, 24 | 210, 25 | 212, 26 | 223, 27 | 250, 28 | 285, 29 | 309, 30 | 311, 31 | 331 32 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group2.json: -------------------------------------------------------------------------------- 1 | [ 2 | 1, 3 | 5, 4 | 12, 5 | 18, 6 | 34, 7 | 35, 8 | 50, 9 | 71, 10 | 77, 11 | 92, 12 | 118, 13 | 123, 14 | 124, 15 | 127, 16 | 133, 17 | 135, 18 | 159, 19 | 160, 20 | 162, 21 | 166, 22 | 174, 23 | 196, 24 | 221, 25 | 232, 26 | 251, 27 | 261, 28 | 271, 29 | 284, 30 | 290, 31 | 304, 32 | 314, 33 | 319, 34 | 339 35 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group3.json: -------------------------------------------------------------------------------- 1 | [ 2 | 10, 3 | 37, 4 | 42, 5 | 47, 6 | 51, 7 | 68, 8 | 81, 9 | 84, 10 | 98, 11 | 99, 12 | 105, 13 | 107, 14 | 108, 15 | 129, 16 | 136, 17 | 187, 18 | 189, 19 | 190, 20 | 246, 21 | 265, 22 | 274, 23 | 275, 24 | 283, 25 | 286, 26 | 292, 27 | 307, 28 | 327, 29 | 334, 30 | 338 31 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group4.json: -------------------------------------------------------------------------------- 1 | [ 2 | 0, 3 | 21, 4 | 25, 5 | 26, 6 | 27, 7 | 58, 8 | 59, 9 | 62, 10 | 101, 11 | 116, 12 | 120, 13 | 122, 14 | 125, 15 | 128, 16 | 161, 17 | 184, 18 | 193, 19 | 195, 20 | 199, 21 | 200, 22 | 213, 23 | 217, 24 | 219, 25 | 238, 26 | 242, 27 | 244, 28 | 245, 29 | 254, 30 | 277, 31 | 288, 32 | 295, 33 | 308, 34 | 324, 35 | 325, 36 | 328, 37 | 340 38 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group5.json: -------------------------------------------------------------------------------- 1 | [ 2 | 3, 3 | 11, 4 | 22, 5 | 23, 6 | 33, 7 | 44, 8 | 46, 9 | 48, 10 | 69, 11 | 70, 12 | 85, 13 | 86, 14 | 113, 15 | 114, 16 | 132, 17 | 145, 18 | 176, 19 | 182, 20 | 185, 21 | 202, 22 | 204, 23 | 218, 24 | 227, 25 | 231, 26 | 259, 27 | 266, 28 | 293, 29 | 298, 30 | 305 31 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group6.json: -------------------------------------------------------------------------------- 1 | [ 2 | 28, 3 | 32, 4 | 38, 5 | 40, 6 | 65, 7 | 72, 8 | 90, 9 | 102, 10 | 117, 11 | 146, 12 | 151, 13 | 163, 14 | 168, 15 | 177, 16 | 192, 17 | 194, 18 | 216, 19 | 260, 20 | 263, 21 | 278, 22 | 280, 23 | 301, 24 | 303, 25 | 317, 26 | 321, 27 | 330, 28 | 341 29 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group7.json: -------------------------------------------------------------------------------- 1 | [ 2 | 7, 3 | 13, 4 | 15, 5 | 16, 6 | 17, 7 | 63, 8 | 73, 9 | 93, 10 | 96, 11 | 104, 12 | 111, 13 | 115, 14 | 119, 15 | 121, 16 | 137, 17 | 139, 18 | 156, 19 | 165, 20 | 172, 21 | 179, 22 | 181, 23 | 211, 24 | 229, 25 | 234, 26 | 255, 27 | 256, 28 | 262, 29 | 289, 30 | 326, 31 | 333, 32 | 336 33 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group8.json: -------------------------------------------------------------------------------- 1 | [ 2 | 6, 3 | 14, 4 | 29, 5 | 49, 6 | 53, 7 | 54, 8 | 55, 9 | 60, 10 | 67, 11 | 87, 12 | 88, 13 | 95, 14 | 103, 15 | 109, 16 | 138, 17 | 144, 18 | 148, 19 | 152, 20 | 154, 21 | 158, 22 | 171, 23 | 178, 24 | 188, 25 | 197, 26 | 207, 27 | 209, 28 | 220, 29 | 235, 30 | 236, 31 | 237, 32 | 240, 33 | 241, 34 | 243, 35 | 247, 36 | 258, 37 | 267, 38 | 268, 39 | 270, 40 | 273, 41 | 276, 42 | 287, 43 | 291, 44 | 296, 45 | 315, 46 | 332, 47 | 335 48 | ] -------------------------------------------------------------------------------- /assets/test_subsample_indices/youtubesubtitles/group9.json: -------------------------------------------------------------------------------- 1 | [ 2 | 8, 3 | 9, 4 | 24, 5 | 31, 6 | 36, 7 | 39, 8 | 43, 9 | 56, 10 | 76, 11 | 78, 12 | 100, 13 | 106, 14 | 110, 15 | 140, 16 | 149, 17 | 153, 18 | 170, 19 | 173, 20 | 183, 21 | 186, 22 | 191, 23 | 208, 24 | 214, 25 | 215, 26 | 224, 27 | 225, 28 | 226, 29 | 228, 30 | 230, 31 | 239, 32 | 253, 33 | 257, 34 | 264, 35 | 269, 36 | 272, 37 | 279, 38 | 281, 39 | 297, 40 | 299, 41 | 300, 42 | 306, 43 | 312, 44 | 313, 45 | 318, 46 | 320, 47 | 329, 48 | 337 49 | ] -------------------------------------------------------------------------------- /lm_perplexity/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAI/lm_perplexity/24c5a04beb2f073b2230c7c7420bd1ec7776f513/lm_perplexity/__init__.py -------------------------------------------------------------------------------- /lm_perplexity/compute_perplexity.py: -------------------------------------------------------------------------------- 1 | import argparse 2 | import json 3 | import numpy as np 4 | import torch 5 | 6 | 7 | def parse_args(): 8 | parser = argparse.ArgumentParser() 9 | parser.add_argument('--perplexity_data_path', required=True) 10 | parser.add_argument('--utf8_conversion_scalar', default=None, type=float) 11 | parser.add_argument('--output_path', default=None) 12 | return parser.parse_args() 13 | 14 | 15 | def main(): 16 | args = parse_args() 17 | perplexity_data = torch.load(args.perplexity_data_path) 18 | aggregate_logprobs = np.concatenate(perplexity_data["all_logprobs"]) 19 | perplexity = np.exp(-aggregate_logprobs.mean()) 20 | result = { 21 | "perplexity": float(perplexity) 22 | } 23 | if args.utf8_conversion_scalar is not None: 24 | result["bpb"] = float(np.log2(perplexity) * args.utf8_conversion_scalar) 25 | if args.output_path: 26 | with open(args.output_path, "w") as f: 27 | f.write(json.dumps(result, indent=2)) 28 | else: 29 | print(json.dumps(result, indent=2)) 30 | 31 | 32 | if __name__ == "__main__": 33 | main() 34 | -------------------------------------------------------------------------------- /lm_perplexity/save_lm_perplexity_data.py: -------------------------------------------------------------------------------- 1 | import argparse 2 | import torch 3 | from tqdm import auto as tqdm_lib 4 | 5 | import lm_dataformat 6 | import lm_perplexity.models as models 7 | import lm_perplexity.utils as utils 8 | 9 | 10 | def parse_args(): 11 | parser = argparse.ArgumentParser() 12 | parser.add_argument('--model_config_path', required=True) 13 | parser.add_argument('--data_path', required=True) 14 | parser.add_argument('--output_path', required=True) 15 | parser.add_argument('--max_docs', type=int, default=None) 16 | parser.add_argument('--doc_indices_path', type=str, default=None) 17 | return parser.parse_args() 18 | 19 | 20 | def compute_perplexity_data(model, data_path, indices=None): 21 | # For expedience, we're going to assume everything fits in memory for now 22 | # Also for expedience we're just going to save lists of arrays 23 | overall_output = { 24 | "all_logprobs": [], 25 | "all_positions": [], 26 | "aggregate_length": 0, 27 | "aggregate_utf8_length": 0. 28 | } 29 | 30 | reader = lm_dataformat.Reader(data_path) 31 | for i, doc in enumerate(tqdm_lib.tqdm(reader.stream_data())): 32 | if indices is not None and i not in indices: 33 | continue 34 | output = model.get_perplexity_data(doc) 35 | if not output: 36 | continue 37 | overall_output["all_logprobs"].append(output["logprobs"]) 38 | overall_output["all_positions"].append(output["positions"]) 39 | overall_output["aggregate_length"] += output["length"] 40 | overall_output["aggregate_utf8_length"] += output["utf8_length"] 41 | 42 | return overall_output 43 | 44 | 45 | def main(): 46 | args = parse_args() 47 | model = models.create_model(args.model_config_path) 48 | if args.doc_indices_path: 49 | assert args.max_docs is None 50 | indices = set(utils.read_json(args.doc_indices_path)) 51 | elif args.max_docs: 52 | assert args.doc_indices_path is None 53 | indices = set(range(args.max_docs)) 54 | else: 55 | indices = None 56 | perplexity_data = compute_perplexity_data( 57 | model=model, 58 | data_path=args.data_path, 59 | indices=indices, 60 | ) 61 | torch.save(perplexity_data, args.output_path) 62 | 63 | 64 | if __name__ == "__main__": 65 | main() 66 | -------------------------------------------------------------------------------- /lm_perplexity/utils.py: -------------------------------------------------------------------------------- 1 | import contextlib 2 | import json 3 | import time 4 | 5 | WB_MAX_IN_TIME_SPAN = 600 6 | WB_TIME_SPAN = 60 7 | 8 | 9 | def read_json(path, **kwargs): 10 | with open(path, mode="r", **kwargs) as f: 11 | return json.loads(f.read()) 12 | 13 | 14 | def write_json(data, path, **kwargs): 15 | with open(path, mode="w", **kwargs) as f: 16 | f.write(json.dumps(data)) 17 | 18 | 19 | def get_rolling_token_windows(token_list, prefix_token, max_seq_len, context_len): 20 | """ 21 | - context_len allows for a rolling window context, allowing each prediction window to potentially 22 | condition on some context 23 | 24 | :param token_list: list 25 | List of tokens to be PREDICTED 26 | :param max_seq_len: int 27 | max_seq_len of model (or max_seq_len we want to use) 28 | :param context_len: int 29 | Amount of desired token context for prediction. Needs to be at least 1. 30 | :param prefix_token: token 31 | Dummy token like so the first token has something to condition on 32 | :return: generator 33 | Generator of tuples 34 | (input_tokens, pred_tokens) 35 | Note: Score only the last len(pred_tokens) logits of the LM 36 | """ 37 | assert 1 <= context_len <= max_seq_len 38 | if not token_list: 39 | return 40 | # +1 offset, going from input->preds 41 | pred_len = max_seq_len - context_len + 1 42 | predicted = 0 43 | 44 | # Special handling for first window: predict all tokens 45 | first_seq_len = min(max_seq_len, len(token_list)) 46 | yield ( 47 | [prefix_token] + token_list[:first_seq_len - 1], 48 | token_list[:first_seq_len] 49 | ) 50 | predicted += first_seq_len 51 | 52 | while predicted < len(token_list): 53 | window_pred_len = min(len(token_list) - predicted, pred_len) 54 | window_end = predicted + window_pred_len 55 | yield ( 56 | token_list[window_end - max_seq_len - 1:window_end - 1], 57 | token_list[window_end - window_pred_len:window_end], 58 | ) 59 | predicted += window_pred_len 60 | 61 | 62 | class WaitBlocker: 63 | def __init__(self, backoff=1, verbose=True, max_in_time_span=WB_MAX_IN_TIME_SPAN, time_span=WB_TIME_SPAN): 64 | self.backoff = backoff 65 | self.verbose = verbose 66 | self.max_in_time_span = max_in_time_span 67 | self.time_span = time_span 68 | self.record = [] 69 | 70 | def wait_until_valid(self): 71 | i = 0 72 | now = time.time() 73 | for i in range(len(self.record)): 74 | if self.record[i] > now - self.time_span: 75 | break 76 | self.record = self.record[i:] 77 | if len(self.record) >= self.max_in_time_span: 78 | delta = self.record[i] - now + self.time_span 79 | print(f"Backing off for {delta:.1f}") 80 | time.sleep(delta) 81 | 82 | def add_record(self): 83 | self.record.append(time.time()) 84 | 85 | @contextlib.contextmanager 86 | def check_valid(self): 87 | self.wait_until_valid() 88 | yield 89 | self.add_record() 90 | -------------------------------------------------------------------------------- /preset_configs/gpt2_large.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt2", 3 | "model_name": "gpt2-large", 4 | "context_len": 1, 5 | "device": "cuda:0" 6 | } -------------------------------------------------------------------------------- /preset_configs/gpt2_medium.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt2", 3 | "model_name": "gpt2-medium", 4 | "context_len": 1, 5 | "device": "cuda:0" 6 | } -------------------------------------------------------------------------------- /preset_configs/gpt2_small.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt2", 3 | "model_name": "gpt2", 4 | "context_len": 1, 5 | "device": "cuda:0" 6 | } -------------------------------------------------------------------------------- /preset_configs/gpt2_xl.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt2", 3 | "model_name": "gpt2-xl", 4 | "context_len": 1, 5 | "device": "cuda:0" 6 | } -------------------------------------------------------------------------------- /preset_configs/gpt3_ada.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt3", 3 | "engine": "ada", 4 | "context_len": 1 5 | } -------------------------------------------------------------------------------- /preset_configs/gpt3_babbage.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt3", 3 | "engine": "babbage", 4 | "context_len": 1 5 | } -------------------------------------------------------------------------------- /preset_configs/gpt3_curie.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt3", 3 | "engine": "curie", 4 | "context_len": 1 5 | } -------------------------------------------------------------------------------- /preset_configs/gpt3_davinci.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "gpt3", 3 | "engine": "davinci", 4 | "context_len": 1 5 | } -------------------------------------------------------------------------------- /scripts/export_test_splits.py: -------------------------------------------------------------------------------- 1 | import argparse 2 | from collections import Counter 3 | from tqdm import auto as tqdm_lib 4 | 5 | import requests 6 | import os 7 | import json 8 | import gzip 9 | from best_download import download_file 10 | from lm_dataformat import Reader, Archive 11 | 12 | 13 | def parse_args(): 14 | parser = argparse.ArgumentParser() 15 | parser.add_argument('--output_dir', required=True) 16 | parser.add_argument('--group_num', type=int, default=0) 17 | return parser.parse_args() 18 | 19 | 20 | DATASET_NAMES_DICT = { 21 | "Github": "github", 22 | "ArXiv": "arxiv", 23 | "Wikipedia (en)": "wikipedia", 24 | "OpenSubtitles": "opensubtitles", 25 | "OpenWebText2": "openwebtext2", 26 | "Gutenberg (PG-19)": "gutenberg", 27 | "DM Mathematics": "dm-mathematics", 28 | "Enron Emails": "enron", 29 | "Books3": "bibliotik", 30 | "PubMed Abstracts": "pubmed-abstracts", 31 | "YoutubeSubtitles": "youtubesubtitles", 32 | "HackerNews": "hackernews", 33 | "Pile-CC": "commoncrawl", 34 | "EuroParl": "europarl", 35 | "USPTO Backgrounds": "uspto", 36 | "FreeLaw": "freelaw", 37 | "NIH ExPorter": "nih-exporter", 38 | "StackExchange": "stackexchange", 39 | "PubMed Central": "pubmed-central", 40 | "Ubuntu IRC": "ubuntu-irc", 41 | "BookCorpus2": "bookcorpus", 42 | "PhilPapers": "philpapers", 43 | } 44 | 45 | # These datasets were too small (in number of docs) to split 10-ways 46 | DATASETS_WITHOUT_SPLIT = [ 47 | "ubuntu-irc", 48 | "bookcorpus", 49 | "philpapers", 50 | ] 51 | 52 | 53 | def main(): 54 | args = parse_args() 55 | os.makedirs(args.output_dir, exist_ok=True) 56 | test_data_path = os.path.join(args.output_dir, "test.jsonl.zst") 57 | if not os.path.exists(test_data_path): 58 | download_file("https://the-eye.eu/public/AI/pile/test.jsonl.zst", test_data_path) 59 | indices = {} 60 | for short_name in DATASET_NAMES_DICT.values(): 61 | if short_name not in DATASETS_WITHOUT_SPLIT: 62 | url = f"https://raw.githubusercontent.com/EleutherAI/lm_perplexity/main/assets/test_subsample_indices/{short_name}/group{args.group_num}.json" 63 | indices[short_name] = set(requests.get(url).json()) 64 | with gzip.open(os.path.join(args.output_dir, f"test_group_{args.group_num}.jsonl.gz"), "wt") as f: 65 | reader = Reader(test_data_path) 66 | counter = Counter() 67 | for text, meta in tqdm_lib.tqdm(reader.stream_data(get_meta=True)): 68 | short_name = DATASET_NAMES_DICT[meta["pile_set_name"]] 69 | if short_name in DATASETS_WITHOUT_SPLIT: 70 | do_write = True 71 | elif counter[short_name] in indices[short_name]: 72 | do_write = True 73 | else: 74 | do_write = False 75 | if do_write: 76 | f.write(json.dumps({"text": text, "name": short_name}) + "\n") 77 | counter[short_name] += 1 78 | 79 | 80 | if __name__ == "__main__": 81 | main() 82 | -------------------------------------------------------------------------------- /tests/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/EleutherAI/lm_perplexity/24c5a04beb2f073b2230c7c7420bd1ec7776f513/tests/__init__.py --------------------------------------------------------------------------------