model:
model_config:
type: TestModelConfig
text_config:
type: TestTextConfig
vision_config:
type: TestVisionConfig
arch:
type: TestModel
loss:
type: TestL1Loss
reduction: 'mean'
metric:
type: TestAccuracy
eval_type: 'classification'
train_dataset: &train_dataset
data_loader:
type: TestDataLoader
dataset_dir: "/dataset/imageNet-1k/train"
transforms:
- type: TestTransforms1
- type: TestTransforms1
sampler:
type: TestSampler
mask_policy:
type: TestModelMask
input_columns: ["image"]
output_columns: [ "image", "mask"]
column_order: [ "image", "mask"]
num_parallel_workers: 8
python_multiprocessing: False
drop_remainder: True
batch_size: 128
repeat: 1
numa_enable: False
prefetch_size: 30
train_dataset_task:
type: TestDataset
dataset_config: *train_dataset
runner_wrapper:
type: TestTrainOneStepWithLossScaleCell
scale_sense: 1024
optimizer:
type: TestAdamWeightDecay
beta1: 0.9
beta2: 0.999
eps: 0.00000001
weight_decay: 0.05
lr_schedule:
type: TestCosineDecayLR
max_lr: 0.00015
min_lr: 0.
decay_steps: 100
runner_config:
epochs: 800
batch_size: 64
sink_mode: True
sink_size: 1
callbacks:
- type: TestLLossMonitor
per_print_times: 10
- type: TestTimeMonitor
data_size: 100
do_train: True
do_eval: False
do_predict: False
pipeline:
type: TestPipeline
processor:
type: TestProcessor
trainer:
type: CausalLanguageModelingTrainer
model_name: 'test_model'