# Copyright (c) 2025, NVIDIA CORPORATION. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Configuration for fine-tuning Gemma 4 31B (dense) on the MedPix dataset for image description
# Requires 8 GPUs (FSDP2 with activation checkpointing)
# torchrun --nproc-per-node=8 examples/vlm_finetune/finetune.py -c examples/vlm_finetune/gemma4/gemma4_31b.yaml

recipe: FinetuneRecipeForVLM
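
# Batch math (a sketch, assuming all 8 GPUs form the data-parallel group):
# global_batch_size 8 = local_batch_size 1 x 8 ranks, so no gradient accumulation is needed.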
step_scheduler:
  global_batch_size: 8
  local_batch_size: 1
  ckpt_every_steps: 500
  val_every_steps: 500
  num_epochs: 2

dist_env:
  backend: nccl
  timeout_minutes: 60

rng:
  _target_: nemo_automodel.components.training.rng.StatefulRNG
  seed: 42
  ranked: true
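
# Rough memory note (a back-of-envelope estimate, not stated in this recipe):
# 31B parameters in bf16 are ~62 GB of weights alone, so FSDP2 sharding across
# the 8 GPUs plus activation checkpointing (below) is what makes this fit.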
model:
  _target_: nemo_automodel.NeMoAutoModelForImageTextToText.from_pretrained
  pretrained_model_name_or_path: google/gemma-4-31B-it
  torch_dtype: torch.bfloat16
  use_liger_kernel: true
  use_sdpa_patching: false
  attn_implementation: eager
  # 31B does not use kv_shared layers (those are only used in the 2B and 4B variants), hence use_cache: false.
  text_config:
    use_cache: false

processor:
  padding_side: right

checkpoint:
  enabled: true
  checkpoint_dir: vlm_checkpoints/gemma4_31b_it/
  model_save_format: torch_save
  save_consolidated: false
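
# Assumption about the sharding layout (not stated in this file): with dp_size
# left as none, the recipe typically derives the data-parallel size from the
# world size, here 8 / (tp_size 1 * cp_size 1) = 8 FSDP2 shards.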
distributed:
  strategy: fsdp2
  dp_size: none
  tp_size: 1
  cp_size: 1
  sequence_parallel: false
  # Activation checkpointing is required for Gemma 4 31B to fit in memory; FSDP alone leads to OOM.
  activation_checkpointing: true

loss_fn:
  _target_: nemo_automodel.components.loss.masked_ce.MaskedCrossEntropy
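
# The small train[:1000] / validation[:500] slices below keep the run short
# (consistent with the 20-minute CI budget at the bottom); for a full
# fine-tune you would presumably use the complete splits.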
dataset:
  _target_: nemo_automodel.components.datasets.vlm.datasets.make_medpix_dataset
  path_or_dataset: mmoukouba/MedPix-VQA
  split: train[:1000]

dataloader:
  _target_: torchdata.stateful_dataloader.StatefulDataLoader
  num_workers: 0
  pin_memory: true
  collate_fn:
    _target_: nemo_automodel.components.datasets.vlm.collate_fns.gemma4_prefix_collate_fn

validation_dataset:
  _target_: nemo_automodel.components.datasets.vlm.datasets.make_medpix_dataset
  path_or_dataset: mmoukouba/MedPix-VQA
  split: validation[:500]

validation_dataloader:
  _target_: torchdata.stateful_dataloader.StatefulDataLoader
  collate_fn:
    _target_: nemo_automodel.components.datasets.vlm.collate_fns.gemma4_prefix_collate_fn

optimizer:
  _target_: torch.optim.AdamW
  lr: 1e-5
  weight_decay: 0.01
  betas: [0.9, 0.95]

lr_scheduler:
  lr_decay_style: cosine
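
# Only the language model is trained: embeddings and the vision/audio towers
# are frozen, which shrinks the trainable parameter count and the AdamW
# optimizer state accordingly.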
freeze_config:
  freeze_embeddings: true
  freeze_vision_tower: true
  freeze_audio_tower: true
  freeze_language_model: false

# wandb:
#   project: <your-project>
#   entity: <your-entity>
#   name: <your-run-name>

ci:
  recipe_owner: athitten
  time: "00:20:00"