|
# Per-file test selection table for the FSDP distributed test files.
#
# Each key is a relative path to a test file under test/distributed/fsdp.
# Each value is either a tuple of individual test-case names or None.
# NOTE(review): presumably the tuple lists the cases to skip for that file and
# None means "no case is skipped" -- confirm against the runner that consumes
# skip_dict, which is not visible here.
skip_dict = {
    "../../../../test/distributed/fsdp/test_fsdp_checkpoint.py": (
        "test_checkpoint_fsdp_wrapping_cpu_offload0_offload_activations_False_use_orig_params_False",
        "test_checkpoint_fsdp_wrapping_cpu_offload1_offload_activations_False_use_orig_params_False",
        "test_checkpoint_fsdp_wrapping_cpu_offload1_offload_activations_True_use_orig_params_False",
        "test_checkpoint_submodule_use_reentrant_False_xpu",
    ),
    "../../../../test/distributed/fsdp/test_fsdp_apply.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_clip_grad_norm.py": (
        # Trailing comma keeps this a one-element tuple rather than a bare string.
        "test_ddp_parity_xpu",
    ),
    "../../../../test/distributed/fsdp/test_fsdp_comm.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_core.py": (
        "test_delayed_optim_step_offload_false_no_shard_xpu",
        "test_delayed_optim_step_offload_false_none_xpu",
        "test_delayed_optim_step_offload_false_shard_grad_op_xpu",
        "test_delayed_optim_step_offload_true_none_xpu",
        "test_delayed_optim_step_offload_true_shard_grad_op_xpu",
        "test_delayed_reduce_scatter_offload_false_no_shard_xpu",
        "test_delayed_reduce_scatter_offload_false_none_xpu",
        "test_delayed_reduce_scatter_offload_false_shard_grad_op_xpu",
        "test_delayed_reduce_scatter_offload_true_none_xpu",
        "test_delayed_reduce_scatter_offload_true_shard_grad_op_xpu",
        "test_mixture_of_experts_offload_false_no_shard_xpu",
        "test_mixture_of_experts_offload_false_none_xpu",
        "test_mixture_of_experts_offload_false_shard_grad_op_xpu",
        "test_mixture_of_experts_offload_true_none_xpu",
        "test_mixture_of_experts_offload_true_shard_grad_op_xpu",
        "test_mixture_of_experts_with_delay_before_free_offload_false_no_shard_xpu",
        "test_mixture_of_experts_with_delay_before_free_offload_false_none_xpu",
        "test_mixture_of_experts_with_delay_before_free_offload_false_shard_grad_op_xpu",
        "test_mixture_of_experts_with_delay_before_free_offload_true_none_xpu",
        "test_mixture_of_experts_with_delay_before_free_offload_true_shard_grad_op_xpu",
        "test_nested_always_wrap_model_offload_false_no_shard_xpu",
        "test_nested_always_wrap_model_offload_false_none_xpu",
        "test_nested_always_wrap_model_offload_false_shard_grad_op_xpu",
        "test_nested_always_wrap_model_offload_true_none_xpu",
        "test_nested_always_wrap_model_offload_true_shard_grad_op_xpu",
        "test_nested_wrapped_model_offload_false_no_shard_xpu",
        "test_nested_wrapped_model_offload_false_none_xpu",
        "test_nested_wrapped_model_offload_false_shard_grad_op_xpu",
        "test_nested_wrapped_model_offload_true_none_xpu",
        "test_nested_wrapped_model_offload_true_shard_grad_op_xpu",
        "test_transformer_offload_false_no_shard_xpu",
        "test_transformer_offload_false_none_xpu",
        "test_transformer_offload_false_shard_grad_op_xpu",
        "test_transformer_offload_true_none_xpu",
        "test_transformer_offload_true_shard_grad_op_xpu",
        # https://github.com/intel/torch-xpu-ops/issues/1475
        "test_transformer_no_grad_mixed_precision_True_xpu",
        "test_transformer_no_grad_mixed_precision_False_xpu",
    ),
    # Entry intentionally left out for now; will be added back after debugging.
    # "../../../../test/distributed/fsdp/test_fsdp_dtensor_state_dict.py": (
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_False_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_False_is_even_sharded_model_True_xpu",
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_True_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_True_is_even_sharded_model_True_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_False_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_False_is_even_sharded_model_True_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_True_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_True_is_even_sharded_model_True_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_False_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_False_is_even_sharded_model_True_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_True_is_even_sharded_model_False_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_True_is_even_sharded_model_True_xpu",
    #     "test_fsdp_init_with_device_mesh_is_even_sharded_model_False_xpu",
    #     "test_fsdp_init_with_device_mesh_is_even_sharded_model_True_xpu",
    #     "test_raises_warning_or_errors_xpu",
    # ),
    "../../../../test/distributed/fsdp/test_fsdp_exec_order.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_fine_tune.py": (
        "test_parity_with_non_frozen_fsdp_xpu",
        "test_parity_with_ddp_xpu",
    ),
    "../../../../test/distributed/fsdp/test_fsdp_fx.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_input.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_multiple_forward.py": None,
    "../../../../test/distributed/fsdp/test_fsdp_multiple_wrapping.py": (
        # NOTE(review): this exact name is also listed under test_fsdp_core.py
        # above -- confirm it really names a case in test_fsdp_multiple_wrapping.py.
        "test_transformer_no_grad_mixed_precision_True_xpu",
    ),
    "../../../../test/distributed/fsdp/test_fsdp_uneven.py": None,
    # Entry intentionally left out for now; will be added back after debugging.
    # "../../../../test/distributed/fsdp/test_hsdp_dtensor_state_dict.py": (
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_False_xpu",
    #     "test_dtensor_sharded_model_load_state_dict_offload_to_cpu_True_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_False_xpu",
    #     "test_dtensor_sharded_optim_load_state_dict_offload_to_cpu_True_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_False_xpu",
    #     "test_dtensor_sharded_tensor_state_dict_identical_offload_to_cpu_True_xpu",
    #     "test_hsdp_init_with_device_mesh_xpu",
    #     "test_root_module_is_not_FSDP_xpu",
    # ),
    "../../../../test/distributed/fsdp/test_utils.py": None,
}
0 commit comments