|
|
|
|
|
|
| - version_range: "transformers 4.36 -> 4.45"
|
| affected_api: "Trainer.evaluate"
|
| description: "Trainer.evaluate() return type changed shape; metrics now nested under .metrics"
|
| breakage_primitive: "ChangeReturnType"
|
| params:
|
| function_name: "evaluate"
|
| old_access: "trainer.evaluate()"
|
| new_access: "trainer.evaluate().metrics"
|
| repair_primitive: "RestoreReturnAccess"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.30 -> 4.40"
|
| affected_api: "TrainingArguments.evaluation_strategy"
|
| description: "Renamed evaluation_strategy -> eval_strategy"
|
| breakage_primitive: "RenameApiCall"
|
| params:
|
| old_name: "evaluation_strategy"
|
| new_name: "eval_strategy"
|
| repair_primitive: "RestoreApiCall"
|
| category: "api_drift"
|
|
|
| - version_range: "datasets 2.14 -> 3.0"
|
| affected_api: "load_dataset"
|
| description: "Default label column was renamed in some GLUE configs"
|
| breakage_primitive: "RestructureDatasetSchema"
|
| params:
|
| old_column: "label"
|
| new_column: "labels"
|
| repair_primitive: "RestoreColumn"
|
| category: "dataset_drift"
|
|
|
| - version_range: "transformers 4.40 -> 4.50"
|
| affected_api: "Trainer.predict"
|
| description: "Method removed; users should use evaluate() with prediction_loss_only=False"
|
| breakage_primitive: "RemoveDeprecatedMethod"
|
| params:
|
| class_name: "Trainer"
|
| method_name: "predict"
|
| replacement: "evaluate"
|
| repair_primitive: "RestoreMethod"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.36 -> 4.40"
|
| affected_api: "TrainingArguments"
|
| description: "num_train_epochs default behavior changed; max_steps now preferred"
|
| breakage_primitive: "ModifyConfigField"
|
| params:
|
| config_class: "TrainingArguments"
|
| field_name: "num_train_epochs"
|
| new_value: "0"
|
| repair_primitive: "RestoreConfigField"
|
| category: "config_drift"
|
|
|
| - version_range: "transformers 4.34 -> 4.42"
|
| affected_api: "Tokenizer.__call__"
|
| description: "padding=True semantics changed; users should pass padding='max_length'"
|
| breakage_primitive: "ChangeTokenizerBehavior"
|
| params:
|
| old_kwarg: "padding"
|
| old_value: "True"
|
| new_kwarg: "padding"
|
| new_value: '"max_length"'
|
| repair_primitive: "RestoreTokenizerKwarg"
|
| category: "tokenizer_drift"
|
|
|
| - version_range: "transformers 4.20 -> 4.30"
|
| affected_api: "imports"
|
| description: "transformers.training_args moved to transformers.training_args_pt"
|
| breakage_primitive: "DeprecateImport"
|
| params:
|
| old_module: "from transformers.training_args"
|
| new_module: "from transformers.training_args_pt"
|
| repair_primitive: "RestoreImport"
|
| category: "import_drift"
|
|
|
| - version_range: "transformers 4.45 -> 4.50"
|
| affected_api: "save_pretrained"
|
| description: "save_pretrained() now defaults safe_serialization to True"
|
| breakage_primitive: "ChangeArgumentSignature"
|
| params:
|
| function_name: "save_pretrained"
|
| removed_arg: "safe_serialization"
|
| added_arg: "safe_serialization"
|
| added_value: "True"
|
| repair_primitive: "RestoreArgument"
|
| category: "api_drift"
|
|
|
| - version_range: "datasets 2.18 -> 3.0"
|
| affected_api: "Dataset.set_format"
|
| description: "set_format(type='torch') signature stricter, columns required"
|
| breakage_primitive: "ChangeArgumentSignature"
|
| params:
|
| function_name: "set_format"
|
| removed_arg: "columns"
|
| added_arg: "columns"
|
| added_value: '["input_ids", "attention_mask", "labels"]'
|
| repair_primitive: "RestoreArgument"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.36 -> 4.45"
|
| affected_api: "Tokenizer.__call__"
|
| description: "max_length default reduced from 512 -> 256 for some tokenizers"
|
| breakage_primitive: "ModifyConfigField"
|
| params:
|
| config_class: "tokenizer"
|
| field_name: "max_length"
|
| new_value: "256"
|
| repair_primitive: "RestoreConfigField"
|
| category: "tokenizer_drift"
|
|
|
| - version_range: "transformers 4.40 -> 4.45"
|
| affected_api: "DataCollatorWithPadding"
|
| description: "Renamed `tokenizer` -> `processing_class` in DataCollator constructors"
|
| breakage_primitive: "RenameApiCall"
|
| params:
|
| old_name: "tokenizer"
|
| new_name: "processing_class"
|
| repair_primitive: "RestoreApiCall"
|
| category: "api_drift"
|
|
|
| - version_range: "datasets 2.14 -> 2.18"
|
| affected_api: "load_dataset"
|
| description: "Some splits renamed; train[:500] semantics changed"
|
| breakage_primitive: "RestructureDatasetSchema"
|
| params:
|
| old_column: "sentence"
|
| new_column: "text"
|
| repair_primitive: "RestoreColumn"
|
| category: "dataset_drift"
|
|
|
| - version_range: "transformers 4.45 -> 4.50"
|
| affected_api: "Trainer"
|
| description: "Trainer.evaluate was deprecated and removed; use evaluate_legacy"
|
| breakage_primitive: "RemoveDeprecatedMethod"
|
| params:
|
| class_name: "Trainer"
|
| method_name: "evaluate"
|
| replacement: "evaluate_legacy"
|
| repair_primitive: "RestoreMethod"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.30 -> 4.40"
|
| affected_api: "PreTrainedModel.from_pretrained"
|
| description: "torch_dtype now required for some quantized model paths"
|
| breakage_primitive: "ChangeArgumentSignature"
|
| params:
|
| function_name: "from_pretrained"
|
| removed_arg: "torch_dtype"
|
| added_arg: "torch_dtype"
|
| added_value: '"auto"'
|
| repair_primitive: "RestoreArgument"
|
| category: "api_drift"
|
|
|
| - version_range: "datasets 3.0 -> 3.2"
|
| affected_api: "Dataset.rename_column"
|
| description: "rename_column raises if target name exists"
|
| breakage_primitive: "RestructureDatasetSchema"
|
| params:
|
| old_column: "labels"
|
| new_column: "label"
|
| repair_primitive: "RestoreColumn"
|
| category: "dataset_drift"
|
|
|
| - version_range: "transformers 4.36 -> 4.42"
|
| affected_api: "TrainingArguments.report_to"
|
| description: "Default report_to changed from 'all' to 'none'"
|
| breakage_primitive: "ModifyConfigField"
|
| params:
|
| config_class: "TrainingArguments"
|
| field_name: "report_to"
|
| new_value: '"all"'
|
| repair_primitive: "RestoreConfigField"
|
| category: "config_drift"
|
|
|
| - version_range: "transformers 4.40 -> 4.50"
|
| affected_api: "imports"
|
| description: "transformers.deepspeed moved to accelerate.utils.deepspeed"
|
| breakage_primitive: "DeprecateImport"
|
| params:
|
| old_module: "from transformers.deepspeed"
|
| new_module: "from accelerate.utils.deepspeed"
|
| repair_primitive: "RestoreImport"
|
| category: "import_drift"
|
|
|
| - version_range: "transformers 4.45 -> 4.50"
|
| affected_api: "Tokenizer return"
|
| description: "Tokenizer call output now returns a BatchEncoding with .encodings attribute"
|
| breakage_primitive: "ChangeReturnType"
|
| params:
|
| function_name: "tokenizer"
|
| old_access: "tokenizer(text)"
|
| new_access: "tokenizer(text).encodings"
|
| repair_primitive: "RestoreReturnAccess"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.30 -> 4.40"
|
| affected_api: "save_pretrained"
|
| description: "save_pretrained -> save_pretrained_directory rename in some classes"
|
| breakage_primitive: "RenameApiCall"
|
| params:
|
| old_name: "save_pretrained"
|
| new_name: "save_pretrained_directory"
|
| repair_primitive: "RestoreApiCall"
|
| category: "api_drift"
|
|
|
| - version_range: "transformers 4.45 -> 4.50"
|
| affected_api: "TrainingArguments.no_cuda"
|
| description: "no_cuda renamed to use_cpu (same polarity; True still forces CPU)"
|
| breakage_primitive: "RenameApiCall"
|
| params:
|
| old_name: "no_cuda"
|
| new_name: "use_cpu"
|
| repair_primitive: "RestoreApiCall"
|
| category: "config_drift"
|
|
|