File size: 940 Bytes
0c1ca58
 
 
 
 
 
 
b86b1ee
0c1ca58
 
 
 
 
 
 
 
 
 
 
 
b86b1ee
 
 
 
0c1ca58
b86b1ee
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
"""
domainTokenizer — Building small models that understand domain tokens, not just words.

This package initializer re-exports the main classes so they can be imported
directly from the package root; the supported names are listed in ``__all__``.

Core components:
  - schema: DomainSchema, FieldSpec, FieldType
  - tokenizers: DomainTokenizerBuilder, per-field tokenizers
  - schemas: Predefined schemas (FINANCE, ECOMMERCE, HEALTHCARE)
    (listed for reference; nothing from it is imported by this module)
  - models: DomainTransformerConfig, DomainTransformerModel,
    DomainTransformerForCausalLM, PeriodicLinearReLU (PLR),
    JointFusionModel, DCNv2
"""

# NOTE: import order is kept as-is on purpose; the submodules are loaded
# eagerly here, so reordering could change import-time behavior.
from .schema import DomainSchema, FieldSpec, FieldType
from .tokenizers.domain_tokenizer import DomainTokenizerBuilder
from .tokenizers.field_tokenizers import (
    BaseFieldTokenizer,
    CalendarTokenizer,
    CategoricalTokenizer,
    DiscreteNumericalTokenizer,
    MagnitudeBucketTokenizer,
    SignTokenizer,
)
from .models.configuration import DomainTransformerConfig
from .models.modeling import DomainTransformerForCausalLM, DomainTransformerModel
from .models.plr_embeddings import PeriodicLinearReLU
from .models.joint_fusion import JointFusionModel, DCNv2

# Explicit public API: marks the imports above as intentional re-exports and
# keeps ``from <package> import *`` limited to these names (the submodule
# bindings created by the imports are no longer star-exported).
# ``__version__`` is deliberately left out so a star-import never overwrites
# the importing module's own ``__version__``; it stays available as an
# attribute of the package.
__all__ = [
    # schema
    "DomainSchema",
    "FieldSpec",
    "FieldType",
    # tokenizers
    "DomainTokenizerBuilder",
    "BaseFieldTokenizer",
    "CalendarTokenizer",
    "CategoricalTokenizer",
    "DiscreteNumericalTokenizer",
    "MagnitudeBucketTokenizer",
    "SignTokenizer",
    # models
    "DomainTransformerConfig",
    "DomainTransformerForCausalLM",
    "DomainTransformerModel",
    "PeriodicLinearReLU",
    "JointFusionModel",
    "DCNv2",
]

__version__ = "0.2.0"