Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
18 commits
Select commit Hold shift + click to select a range
9d35997
Fix BLT training_ci overfit test by disabling cache and adjusting tra…
preetam1407 Dec 7, 2025
23da2e1
Fix BLT training_ci overfit test by disabling cache and adjusting tra…
preetam1407 Dec 7, 2025
624e22c
Fix BLT training_ci overfit test by disabling cache and adjusting tra…
preetam1407 Dec 7, 2025
b4504b9
Format BLT tests with ruff
preetam1407 Dec 7, 2025
5902dec
Merge branch 'main' into fix-blt-training-ci
3outeille Dec 8, 2025
832581d
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
9feb586
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
00d1897
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
3e5700e
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
495094c
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
a7ce3b7
Fix BLT training CI with custom weight initialization and overfit test
preetam1407 Dec 11, 2025
bd279d9
Update BLT init logic and adjust repo checks for non-functional model…
preetam1407 Dec 11, 2025
4e64382
Fix repo/config checks by marking BLT Text/Vision models as placeholders
preetam1407 Dec 11, 2025
9803753
Fix repo/config checks by marking BLT Text/Vision models as placeholders
preetam1407 Dec 11, 2025
884ff6b
Fix repo/config checks by marking BLT Text/Vision models as placeholders
preetam1407 Dec 11, 2025
1414e70
Merge branch 'main' into fix-blt-training-ci
3outeille Dec 11, 2025
e60b3a3
Document BLT weight initialization sources and restore default overfi…
preetam1407 Dec 11, 2025
6c53915
Align BLT weight init with nn.init
preetam1407 Dec 11, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
22 changes: 22 additions & 0 deletions src/transformers/models/blt/configuration_blt.py
Original file line number Diff line number Diff line change
Expand Up @@ -335,6 +335,7 @@ def __init__(
tie_word_embeddings: Optional[bool] = False,
initializer_range: Optional[float] = 0.02,
rope_parameters: Optional[RopeParameters | dict[str, RopeParameters]] = None,
use_cache: Optional[bool] = False,
**kwargs,
):
# Basic model configuration
Expand Down Expand Up @@ -406,16 +407,37 @@ def __init__(
)

self.rope_parameters = rope_parameters
if "use_cache" not in kwargs:
kwargs["use_cache"] = use_cache
self.use_cache = kwargs["use_cache"]

# Remove tie_word_embeddings from kwargs to avoid duplicate parameter error
kwargs.pop("tie_word_embeddings", None)
super().__init__(tie_word_embeddings=tie_word_embeddings, **kwargs)


class BltTextConfig(PreTrainedConfig):
    """Configuration class for the text component of Blt.

    The body is intentionally empty: nothing is added on top of
    `PreTrainedConfig`, so every attribute and behavior is inherited as-is.
    """


class BltVisionConfig(PreTrainedConfig):
    """Configuration class for the vision component of Blt.

    The body is intentionally empty: nothing is added on top of
    `PreTrainedConfig`, so every attribute and behavior is inherited as-is.
    """


# Public API of this module: the names exported by `from ... import *`.
__all__ = [
    "BltConfig",
    "BltPatcherConfig",
    "BltLocalEncoderConfig",
    "BltLocalDecoderConfig",
    "BltGlobalTransformerConfig",
    "BltTextConfig",
    "BltVisionConfig",
]
Loading