@@ -525,11 +525,10 @@ def from_feurer(drop_missing: bool = True) -> 'Environments':
525
525
drop_missing: Exclude interactions with missing context features.
526
526
527
527
Remarks:
528
- The description of the benchmark is provided at https://arxiv.org/abs/2007.04074.
529
- For Task ids 232, 3044, 75105, and 211723 every row has a missing feature. These
530
- environments will be empty when drop_missing is True. Task id 189866 has been
531
- updated to 361282, a new version of the original dataset that fixes api issues
532
- with the old dataset.
528
+ The benchmark is described at https://arxiv.org/abs/2007.04074. For task ids
529
+ 232, 3044, 75105, and 211723 every row has a missing feature. These environments
530
+ will be empty when drop_missing is True. Task id 189866 has been removed due to an
531
+ OpenML issue (see https://github.com/openml/OpenML/issues/1036 for more information).
533
532
534
533
Returns:
535
534
An Environments object.
@@ -552,13 +551,84 @@ def from_feurer(drop_missing: bool = True) -> 'Environments':
552
551
167152 ,167161 ,167168 ,167181 ,167184 ,167185 ,167190 ,167200 ,167201 ,167202 ,167203 ,
553
552
167204 ,167205 ,168785 ,168791 ,168792 ,168793 ,168794 ,168795 ,168796 ,168797 ,168798 ,
554
553
189779 ,189786 ,189828 ,189829 ,189836 ,189840 ,189841 ,189843 ,189844 ,189845 ,189846 ,
555
- 189858 ,189859 ,189860 ,189861 ,189862 ,189863 ,189864 ,189865 ,361282 , 189869 ,189870 ,
554
+ 189858 ,189859 ,189860 ,189861 ,189862 ,189863 ,189864 ,189865 ,189869 ,189870 ,
556
555
189871 ,189872 ,189873 ,189874 ,189875 ,189878 ,189880 ,189881 ,189882 ,189883 ,189884 ,
557
556
189887 ,189890 ,189893 ,189894 ,189899 ,189900 ,189902 ,189905 ,189906 ,189908 ,189909 ,
558
557
190154 ,190155 ,190156 ,190157 ,190158 ,190159 ,211720 ,211721 ,211722 ,211723 ,211724 ]
559
558
560
559
return Environments .from_openml (task_id = task_ids ,drop_missing = drop_missing )
561
560
561
@staticmethod
def from_bietti(drop_missing: bool = True) -> 'Environments':
    """Create Environments from the Bietti benchmark.

    Args:
        drop_missing: Exclude interactions with missing context features.

    Remarks:
        The benchmark is defined in https://www.jmlr.org/papers/volume22/18-863/18-863.pdf.

        The benchmark has many datasets repeated with small variations such
        as a multiclass version and a binary version. Some datasets have many
        more variations than others (e.g., fri_c0_1000_10 has 79 variations).
        This benchmark also has several synthetically generated datasets such as
        RandomRBF_0_0, fri_c0_1000_10, and synthetic_control.

        The following changes were made to the original data ids:
            1. 21 was replaced with a newer version 40975
            2. 292 was replaced with a newer version 40981
            3. 478 was replaced with a newer version 40971
            4. 822 was removed because it is an old version of 823
            5. 872 was removed because it is an old version of 853
            6. 948 was removed because it is an old version of 772
            7. 1036 was replaced with a newer version 40992
            8. 1043 was replaced with a newer version 40993
            9. 1454 was removed because it is a duplicate of 1049
            10. 1470 was replaced with a newer version 23381
            11. 1217 was removed because it is a subsample of 1216
            12. 1113 was removed because it is a subsample of 1110

    Returns:
        An Environments object.
    """

    # NOTE: 1113 and 1217 are intentionally absent, matching items 11 and 12 of
    # the change list in the docstring (they are subsamples of 1110 and 1216).
    data_ids = [
        3, 6, 10, 11, 12, 14, 16, 18, 20, 22, 23, 26, 28, 30, 31, 32, 36, 37, 39, 40, 41, 43, 44, 46,
        48, 50, 53, 54, 59, 60, 61, 62, 150, 151, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162,
        180, 181, 182, 183, 184, 187, 273, 275, 276, 277, 278, 279, 285, 293, 300, 307, 310, 312, 313,
        329, 333, 334, 335, 336, 337, 338, 339, 343, 346, 351, 354, 357, 375, 377, 383, 384, 385, 386,
        387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 444, 446, 448, 450,
        457, 458, 459, 461, 462, 463, 464, 465, 467, 468, 469, 472, 475, 476, 477, 479, 480, 554,
        679, 682, 683, 685, 694, 713, 714, 715, 716, 717, 718, 719, 720, 721, 722, 723, 724, 725,
        726, 727, 728, 729, 730, 731, 732, 733, 734, 735, 736, 737, 740, 741, 742, 743, 744, 745, 746,
        747, 748, 749, 750, 751, 752, 753, 754, 755, 756, 758, 759, 761, 762, 763, 764, 765, 766, 767,
        768, 769, 770, 771, 772, 773, 774, 775, 776, 777, 778, 779, 780, 782, 783, 784, 785, 787, 788,
        789, 790, 791, 792, 793, 794, 795, 796, 797, 799, 800, 801, 803, 804, 805, 806, 807, 808, 811,
        812, 813, 814, 815, 816, 817, 818, 819, 820, 821, 823, 824, 825, 826, 827, 828, 829, 830,
        832, 833, 834, 835, 836, 837, 838, 841, 843, 845, 846, 847, 848, 849, 850, 851, 853, 855, 857,
        859, 860, 862, 863, 864, 865, 866, 867, 868, 869, 870, 871, 873, 874, 875, 876, 877, 878,
        879, 880, 881, 882, 884, 885, 886, 888, 891, 892, 893, 894, 895, 896, 900, 901, 902, 903, 904,
        905, 906, 907, 908, 909, 910, 911, 912, 913, 914, 915, 916, 917, 918, 919, 920, 921, 922, 923,
        924, 925, 926, 927, 928, 929, 931, 932, 933, 934, 935, 936, 937, 938, 941, 942, 943, 945, 946,
        947, 949, 950, 951, 952, 953, 954, 955, 956, 958, 959, 962, 964, 965, 969, 970, 971, 973,
        974, 976, 977, 978, 979, 980, 983, 987, 988, 991, 994, 995, 996, 997, 1004, 1005, 1006, 1009,
        1011, 1012, 1013, 1014, 1015, 1016, 1019, 1020, 1021, 1022, 1025, 1026, 1038, 1040, 1041,
        1044, 1045, 1046, 1048, 1049, 1050, 1054, 1055, 1056, 1059, 1060, 1061, 1062, 1063, 1064,
        1065, 1066, 1067, 1068, 1069, 1071, 1073, 1075, 1077, 1078, 1079, 1080, 1081, 1082, 1083,
        1084, 1085, 1086, 1087, 1088, 1100, 1104, 1106, 1107, 1110, 1115, 1116, 1117, 1120,
        1121, 1122, 1123, 1124, 1125, 1126, 1127, 1128, 1129, 1130, 1131, 1132, 1133, 1135, 1136,
        1137, 1138, 1139, 1140, 1141, 1142, 1143, 1144, 1145, 1146, 1147, 1148, 1149, 1150, 1151,
        1152, 1153, 1154, 1155, 1156, 1157, 1158, 1159, 1160, 1161, 1162, 1163, 1164, 1165, 1166,
        1169, 1216, 1218, 1233, 1235, 1236, 1237, 1238, 1241, 1242, 1412, 1413, 1441, 1442,
        1443, 1444, 1449, 1451, 1453, 1455, 1457, 1459, 1460, 1464, 1467, 1471, 1472, 1473, 1475,
        1481, 1482, 1483, 1486, 1487, 1488, 1489, 1496, 1498, 1590, 40975, 40981, 40971, 23381,
    ]

    # The replacements for 1036 and 1043 are requested on their own because they
    # are loaded with an explicit target column ('label') rather than the default.
    # NOTE(review): presumably their default OpenML target is unsuitable -- confirm.
    env40992 = Environments.from_openml(data_id=40992, target='label', drop_missing=drop_missing)
    env40993 = Environments.from_openml(data_id=40993, target='label', drop_missing=drop_missing)

    # The two explicitly-targeted environments are appended after the bulk list.
    return Environments.from_openml(data_id=data_ids, drop_missing=drop_missing) + env40992 + env40993
629
+
630
+
631
+
562
632
def __init__ (self , * environments : Union [Environment , Sequence [Environment ]]):
563
633
"""Instantiate an Environments class.
564
634
0 commit comments