Skip to content

Commit

Permalink
feat(DRAFT): Improve flights.* dataset reproducibility
Browse files Browse the repository at this point in the history
  • Loading branch information
dangotbanned committed Dec 10, 2024
1 parent efa018a commit ad1b862
Show file tree
Hide file tree
Showing 10 changed files with 1,623 additions and 5 deletions.
57 changes: 57 additions & 0 deletions _data/flights.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,57 @@
[[specs]]
# Temporary spec: it will not be part of the final PR.
# It exists to demonstrate the deviation from [ISO_8601](https://en.wikipedia.org/wiki/ISO_8601).
# Unlike the other specs in this file, the date span is given as a two-element
# `range` array of TOML local dates instead of separate `start`/`end` keys.
range = [2001-01-01, 2001-03-31]
n_rows = 1_000
suffix = ".csv"
# NOTE(review): upper-case "ISO" here vs lower-case "iso" in the other specs;
# presumably the consumer treats these as distinct formats - confirm before merging.
dt_format = "ISO"

[[specs]]
# Element of the `specs` array of tables: 2_000 rows, ".json" suffix, "iso" datetime format.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
# NOTE(review): whether `end` is inclusive is decided by the consumer - confirm.
start = 2001-01-01
end = 2001-03-31
n_rows = 2_000
suffix = ".json"
dt_format = "iso"

[[specs]]
# Element of the `specs` array of tables: 5_000 rows, ".json" suffix, "iso" datetime format.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
# NOTE(review): whether `end` is inclusive is decided by the consumer - confirm.
start = 2001-01-01
end = 2001-03-31
n_rows = 5_000
suffix = ".json"
dt_format = "iso"

[[specs]]
# Element of the `specs` array of tables: 10_000 rows, ".json" suffix, "iso" datetime format.
# NOTE(review): presumably the spec behind `data/flights-10k.json` - confirm against the generator.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
# NOTE(review): whether `end` is inclusive is decided by the consumer - confirm.
start = 2001-01-01
end = 2001-03-31
n_rows = 10_000
suffix = ".json"
dt_format = "iso"

[[specs]]
# Element of the `specs` array of tables: 20_000 rows, ".json" suffix, "iso" datetime format.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
# NOTE(review): whether `end` is inclusive is decided by the consumer - confirm.
start = 2001-01-01
end = 2001-03-31
n_rows = 20_000
suffix = ".json"
dt_format = "iso"

[[specs]]
# Element of the `specs` array of tables: 200_000 rows, ".json" suffix.
# Shares its dates, row count, `dt_format` and `columns` with the ".arrow" spec
# in this file; only `suffix` differs between the two.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
start = 2001-01-01
end = 2001-03-31
n_rows = 200_000
suffix = ".json"
# "decimal" rather than the "iso" used by the smaller ".json" specs.
# NOTE(review): the exact encoding "decimal" selects is defined by the consumer - confirm.
dt_format = "decimal"
# Explicit column list; the specs without this key give none.
# NOTE(review): presumably restricts the output to these three columns - confirm.
columns = ["delay", "distance", "time"]

[[specs]]
# Element of the `specs` array of tables: 200_000 rows, ".arrow" suffix.
# Shares its dates, row count, `dt_format` and `columns` with the 200_000-row
# ".json" spec in this file; only `suffix` differs between the two.
# `start` and `end` are TOML local dates (no time-of-day or UTC offset).
start = 2001-01-01
end = 2001-03-31
n_rows = 200_000
suffix = ".arrow"
# NOTE(review): the exact encoding "decimal" selects is defined by the consumer - confirm.
dt_format = "decimal"
# Explicit column list; the specs without this key give none.
# NOTE(review): presumably restricts the output to these three columns - confirm.
columns = ["delay", "distance", "time"]

[[specs]]
# Element of the `specs` array of tables: 3_000_000 rows, ".parquet" suffix.
# This is the only spec in this file whose `end` is 2001-06-30 rather than 2001-03-31,
# and the only one with no `dt_format` key.
# NOTE(review): presumably the consumer falls back to a default datetime handling
# when `dt_format` is absent - confirm.
start = 2001-01-01
end = 2001-06-30
n_rows = 3_000_000
suffix = ".parquet"
2 changes: 1 addition & 1 deletion data/flights-10k.json

Large diffs are not rendered by default.

Loading

0 comments on commit ad1b862

Please sign in to comment.