Skip to content

Commit a88ff4c

Browse files
authored
feat: Improve flights.* dataset reproducibility (#645)
1 parent 14cc146 commit a88ff4c

14 files changed

+1024
-751
lines changed

_data/flights.toml

+49
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,49 @@
1+
[[specs]]
2+
start = 2001-01-01
3+
end = 2001-03-31
4+
n_rows = 2_000
5+
suffix = ".json"
6+
dt_format = "%Y/%m/%d %H:%M"
7+
8+
[[specs]]
9+
start = 2001-01-01
10+
end = 2001-03-31
11+
n_rows = 5_000
12+
suffix = ".json"
13+
dt_format = "%Y/%m/%d %H:%M"
14+
15+
[[specs]]
16+
start = 2001-01-01
17+
end = 2001-03-31
18+
n_rows = 10_000
19+
suffix = ".json"
20+
dt_format = "%Y/%m/%d %H:%M"
21+
22+
[[specs]]
23+
start = 2001-01-01
24+
end = 2001-03-31
25+
n_rows = 20_000
26+
suffix = ".json"
27+
dt_format = "%Y/%m/%d %H:%M"
28+
29+
[[specs]]
30+
start = 2001-01-01
31+
end = 2001-03-31
32+
n_rows = 200_000
33+
suffix = ".json"
34+
dt_format = "decimal"
35+
columns = ["delay", "distance", "time"]
36+
37+
[[specs]]
38+
start = 2001-01-01
39+
end = 2001-03-31
40+
n_rows = 200_000
41+
suffix = ".arrow"
42+
dt_format = "decimal"
43+
columns = ["delay", "distance", "time"]
44+
45+
[[specs]]
46+
start = 2001-01-01
47+
end = 2001-06-30
48+
n_rows = 3_000_000
49+
suffix = ".parquet"

data/flights-10k.json

+1-1
Large diffs are not rendered by default.

data/flights-200k.arrow

-1.27 MB
Binary file not shown.

data/flights-200k.json

+1-1
Large diffs are not rendered by default.

data/flights-20k.json

+1-1
Large diffs are not rendered by default.

data/flights-2k.json

+1-1
Large diffs are not rendered by default.

data/flights-3m.parquet

6.08 KB
Binary file not shown.

data/flights-5k.json

+1-1
Large diffs are not rendered by default.

datapackage.json

+1-1
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@
2020
}
2121
],
2222
"version": "2.11.0",
23-
"created": "2024-12-14T19:35:54.935236+00:00",
23+
"created": "2024-12-19T18:26:48.655674+00:00",
2424
"resources": [
2525
{
2626
"name": "7zip.png",

datapackage.md

+1-1
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
# vega-datasets
2-
`2.11.0` | [GitHub](http://github.com/vega/vega-datasets.git) | 2024-12-14 19:35:54 [UTC]
2+
`2.11.0` | [GitHub](http://github.com/vega/vega-datasets.git) | 2024-12-19 18:26:48 [UTC]
33

44
Common repository for example datasets used by Vega related projects.
55
BSD-3-Clause license applies only to package code and infrastructure. Users should verify their use of datasets

package.json

-1
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,6 @@
4646
"scripts": {
4747
"prebuild": "./scripts/make-url-index.sh > src/urls.ts && ./scripts/build_datapackage.py",
4848
"build": "rollup -c",
49-
"flights": "node scripts/flights.js",
5049
"github": "python scripts/github.py",
5150
"release": "release-it"
5251
}

pyproject.toml

+1-2
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,6 @@ dev = ["ipython[kernel]>=8.30.0", "ruff>=0.8.2", "taplo>=0.9.3"]
1919
extend-exclude = [
2020
".venv",
2121
"scripts/budget.py",
22-
"scripts/flights.py",
2322
"scripts/github.py",
2423
"scripts/make-unemployment-across-industries.py",
2524
"scripts/update_countries_json.py",
@@ -111,7 +110,7 @@ select = [
111110
[tool.pyright]
112111
enableExperimentalFeatures = true
113112
ignore = ["../../../**/Lib", ".venv"]
114-
include = ["./scripts/build_datapackage.py", "./scripts/flights2.py"]
113+
include = ["./scripts/build_datapackage.py", "./scripts/flights.py"]
115114
pythonPlatform = "All"
116115
pythonVersion = "3.12"
117116
reportUnusedExpression = "none"

scripts/flights.js

-33
This file was deleted.

0 commit comments

Comments
 (0)