# Repository page header (scraped metadata, not part of the module source):
#   user:   rtferraz
#   commit: b86b1ee (verified) - "Update package init to v0.2.0 with model exports"
#   size:   940 bytes
"""
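domainTokenizer — Building small models that understand domain tokens, not just words.

Core components (the classes named below are re-exported from the package root,
except for the predefined schemas, which this file does not import):

- schema: DomainSchema, FieldSpec, FieldType
- tokenizers: DomainTokenizerBuilder and the per-field tokenizers
  (BaseFieldTokenizer, CalendarTokenizer, CategoricalTokenizer,
  DiscreteNumericalTokenizer, MagnitudeBucketTokenizer, SignTokenizer)
- schemas: Predefined schemas (FINANCE, ECOMMERCE, HEALTHCARE)
- models: DomainTransformerConfig, DomainTransformerModel,
  DomainTransformerForCausalLM, PeriodicLinearReLU (PLR),
  JointFusionModel, DCNv2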
"""
# Public re-exports: each import below makes the named classes available
# directly from the package root. The statement order is left as-is because
# importing a submodule executes it, so reordering could change import-time
# behaviour.

# Re-exported from the `schema` module.
from .schema import DomainSchema, FieldSpec, FieldType

# Re-exported from the `tokenizers` subpackage: the builder and the
# individual field tokenizer classes.
from .tokenizers.domain_tokenizer import DomainTokenizerBuilder
from .tokenizers.field_tokenizers import (
BaseFieldTokenizer,
CalendarTokenizer,
CategoricalTokenizer,
DiscreteNumericalTokenizer,
MagnitudeBucketTokenizer,
SignTokenizer,
)

# Re-exported from the `models` subpackage: configuration, transformer
# models, PLR embeddings and the joint-fusion classes.
from .models.configuration import DomainTransformerConfig
from .models.modeling import DomainTransformerForCausalLM, DomainTransformerModel
from .models.plr_embeddings import PeriodicLinearReLU
from .models.joint_fusion import JointFusionModel, DCNv2

# Package version string.
__version__ = "0.2.0"