google
diff --git a/.github/workflows/cpu-tests.yml b/.github/workflows/cpu-tests.yml
Lines changed: 44 additions & 44 deletions
diff --git a/.github/workflows/tpu-tests.yml b/.github/workflows/tpu-tests.yml
Lines changed: 91 additions & 91 deletions
diff --git a/tests/cli/utils/model_test.py b/tests/cli/utils/model_test.py
Lines changed: 31 additions & 7 deletions
diff --git a/tunix/cli/config.py b/tunix/cli/config.py
Lines changed: 1 addition & 0 deletions
@@ -26,54 +26,54 @@ jobs:
   # copybara:strip_begin
   # LINT.IfChange()
   # copybara:strip_end
-  run:
-  # copybara:strip_begin
-  # LINT.ThenChange(Internal path for github_actions, don't change this line.)
-  # copybara:strip_end
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-      - uses: actions/setup-python@v4
-        with:
-          python-version: '3.11'
+  # run:
+  # # copybara:strip_begin
+  # # LINT.ThenChange(Internal path for github_actions, don't change this line.)
+  # # copybara:strip_end
+  #   runs-on: ubuntu-latest
+  #   steps:
+  #     - uses: actions/checkout@v4
+  #     - uses: actions/setup-python@v4
+  #       with:
+  #         python-version: '3.11'
 
-      - name: Download the tunix wheel
-        uses: actions/download-artifact@634f93cb2916e3fdff6788551b99b062d0335ce0 # v5.0.0
-        with:
-          name: tunix-wheel
+  #     - name: Download the tunix wheel
+  #       uses: actions/download-artifact@634f93cb2916e3fdff6788551b99b062d0335ce0 # v5.0.0
+  #       with:
+  #         name: tunix-wheel
 
-      - name: Install the tunix wheel
-        run: |
-          python -m pip install --upgrade pip
-          python -m pip install google_tunix-*-py3-none-any.whl
-          python -m pip install pytest
+  #     - name: Install the tunix wheel
+  #       run: |
+  #         python -m pip install --upgrade pip
+  #         python -m pip install google_tunix-*-py3-none-any.whl
+  #         python -m pip install pytest
 
-      - name: Verify Tunix imports from installed package
-        run: |
-          python3 -c "
-          import tunix
-          import tunix.models
-          import tunix.generate
-          import tunix.sft
-          import tunix.distillation
-          import tunix.rl
+  #     - name: Verify Tunix imports from installed package
+  #       run: |
+  #         python3 -c "
+  #         import tunix
+  #         import tunix.models
+  #         import tunix.generate
+  #         import tunix.sft
+  #         import tunix.distillation
+  #         import tunix.rl
 
-          assert tunix.__version__ != '0.0.0.dev0', 'Tunix version not set correctly'
-          print('All tunix modules imported successfully and version is', tunix.__version__)
-          "
-      - name: Run agentic RL tests
-        run: |
-          python -m pytest tests/rl/agentic/ -v --tb=short
+  #         assert tunix.__version__ != '0.0.0.dev0', 'Tunix version not set correctly'
+  #         print('All tunix modules imported successfully and version is', tunix.__version__)
+  #         "
+  #     - name: Run agentic RL tests
+  #       run: |
+  #         python -m pytest tests/rl/agentic/ -v --tb=short
 
-      - name: Run Cli utils tests
-        run: |
-          python -m pytest tests/cli/utils/ -v --tb=short
+  #     - name: Run Cli utils tests
+  #       run: |
+  #         python -m pytest tests/cli/utils/ -v --tb=short
 
-      - name: Run model alignment tests
-        run: |
-          python -m pip install torch
-          python -m pytest tests/model_alignment/ -v --tb=short
+  #     - name: Run model alignment tests
+  #       run: |
+  #         python -m pip install torch
+  #         python -m pytest tests/model_alignment/ -v --tb=short
 
-      - name: Run perf tests
-        run: |
-          python -m pytest tests/perf/ -v --tb=short
+  #     - name: Run perf tests
+  #       run: |
+  #         python -m pytest tests/perf/ -v --tb=short
@@ -33,97 +33,97 @@ env:
   HF_HUB_ENABLE_HF_TRANSFER: "1"
 
 jobs:
-  run_prod:
-    runs-on: [linux-x86-ct5lp-224-8tpu]
-    environment: testing
-    container:
-      image: us-docker.pkg.dev/tpu-prod-env-multipod/jax-stable-stack/candidate/tpu:latest
-      options: --privileged
-      env:
-        CLOUD_TPU_ACCELERATOR: v5e-8
-        JAX_PLATFORMS: tpu
-    steps:
-
-    # Cache Hugging Face hub
-    - name: Cache HF hub
-      uses: actions/cache@v4
-      with:
-        path: ~/.cache/huggingface
-        key: hf-${{ runner.os }}-${{ hashFiles('pyproject.toml', 'requirements*.txt', 'constraints*.txt') }}
-        restore-keys: |
-          hf-${{ runner.os }}-
-
-    - name: Checkout code
-      uses: actions/checkout@v4
-      with:
-        fetch-depth: 0
-
-    - name: Install tunix dependencies
-      run: |
-        pip install --upgrade pip
-        pip install -e .[prod] --force-reinstall
-        pip install pytest pytest-xdist
-
-    - name: Verify TPU availability
-      run: |
-        python -c "
-        import jax
-        print(f'JAX version: {jax.__version__}')
-        print(f'JAX devices: {jax.devices()}')
-
-        # Check if we have TPU devices specifically
-        devices = jax.devices()
-        has_tpu = len(devices) > 0 and all(device.platform == 'tpu' for device in devices)
-        print(f'TPU available: {has_tpu}')
-
-        if not has_tpu:
-            print('ERROR: No TPU devices found! Expected TPU devices but got:', [device.platform for device in devices])
-            exit(1)
-        else:
-            print(f'SUCCESS: Found {len(devices)} TPU device(s)')
-        "
-
-    - name: Run tunix model tests
-      run: |
-        python -m pytest tests/models/ -v --tb=short -m "not cpu_only and not gpu_only"
-
-    - name: Run tunix generation tests (PASSED only)
-      run: |
-        # tokenizer_adapter_test requires access to gated repo
-        # TODO(b/459824938) Add back test_logprobs_extraction_with_missing_token after fixing the issue
-        python -m pytest tests/generate/ -v --tb=short \
-          --ignore=tests/generate/vllm_sampler_test.py \
-          --ignore=tests/generate/vllm_driver_test.py \
-          --ignore=tests/generate/tokenizer_adapter_test.py \
-          --ignore=tests/generate/sglang_jax_sampler_test.py \
-          --ignore=tests/generate/utils_test.py
-
-        python -m pytest tests/generate/utils_test.py -k "not test_logprobs_extraction_with_missing_token"
-
-    - name: Run tunix SFT tests
-      run: |
-        python -m pytest tests/sft/ -v --tb=short
-
-    - name: Run tunix distillation tests
-      run: |
-        python -m pytest tests/distillation/ -v --tb=short
-
-    - name: Run tunix RL tests
-      run: |
-        # RL common tests that passed
-        # b/448133814: test_grpo_with_lora_model fails
-        python -m pytest tests/rl/ -v --tb=short -k "not test_grpo_with_lora_model" --ignore=tests/rl/experimental/agentic
-
-    - name: Run tunix tests not covered by the above categories
-      run: |
-        # This category is to catch tests added but not covered by CI yet. Whenever you add new folders under tests/, please add a new category above and skip those tests here.
-        python -m pytest tests/ -v --tb=short --ignore=tests/perf/ --ignore=tests/model_alignment/ --ignore=tests/models/ --ignore=tests/cli/ --ignore=tests/generate/ --ignore=tests/sft/ --ignore=tests/distillation/ --ignore=tests/rl/ || code=$?
-        if [ "${code:-0}" = "5" ]; then
-          echo "No tests collected (expected)."
-          exit 0
-        else
-          exit "${code:-0}"
-        fi
+  # run_prod:
+  #   runs-on: [linux-x86-ct5lp-224-8tpu]
+  #   environment: testing
+  #   container:
+  #     image: us-docker.pkg.dev/tpu-prod-env-multipod/jax-stable-stack/candidate/tpu:latest
+  #     options: --privileged
+  #     env:
+  #       CLOUD_TPU_ACCELERATOR: v5e-8
+  #       JAX_PLATFORMS: tpu
+  #   steps:
+
+  #   # Cache Hugging Face hub
+  #   - name: Cache HF hub
+  #     uses: actions/cache@v4
+  #     with:
+  #       path: ~/.cache/huggingface
+  #       key: hf-${{ runner.os }}-${{ hashFiles('pyproject.toml', 'requirements*.txt', 'constraints*.txt') }}
+  #       restore-keys: |
+  #         hf-${{ runner.os }}-
+
+  #   - name: Checkout code
+  #     uses: actions/checkout@v4
+  #     with:
+  #       fetch-depth: 0
+
+  #   - name: Install tunix dependencies
+  #     run: |
+  #       pip install --upgrade pip
+  #       pip install -e .[prod] --force-reinstall
+  #       pip install pytest pytest-xdist
+
+  #   - name: Verify TPU availability
+  #     run: |
+  #       python -c "
+  #       import jax
+  #       print(f'JAX version: {jax.__version__}')
+  #       print(f'JAX devices: {jax.devices()}')
+
+  #       # Check if we have TPU devices specifically
+  #       devices = jax.devices()
+  #       has_tpu = len(devices) > 0 and all(device.platform == 'tpu' for device in devices)
+  #       print(f'TPU available: {has_tpu}')
+
+  #       if not has_tpu:
+  #           print('ERROR: No TPU devices found! Expected TPU devices but got:', [device.platform for device in devices])
+  #           exit(1)
+  #       else:
+  #           print(f'SUCCESS: Found {len(devices)} TPU device(s)')
+  #       "
+
+  #   - name: Run tunix model tests
+  #     run: |
+  #       python -m pytest tests/models/ -v --tb=short -m "not cpu_only and not gpu_only"
+
+  #   - name: Run tunix generation tests (PASSED only)
+  #     run: |
+  #       # tokenizer_adapter_test requires access to gated repo
+  #       # TODO(b/459824938) Add back test_logprobs_extraction_with_missing_token after fixing the issue
+  #       python -m pytest tests/generate/ -v --tb=short \
+  #         --ignore=tests/generate/vllm_sampler_test.py \
+  #         --ignore=tests/generate/vllm_driver_test.py \
+  #         --ignore=tests/generate/tokenizer_adapter_test.py \
+  #         --ignore=tests/generate/sglang_jax_sampler_test.py \
+  #         --ignore=tests/generate/utils_test.py
+
+  #       python -m pytest tests/generate/utils_test.py -k "not test_logprobs_extraction_with_missing_token"
+
+  #   - name: Run tunix SFT tests
+  #     run: |
+  #       python -m pytest tests/sft/ -v --tb=short
+
+  #   - name: Run tunix distillation tests
+  #     run: |
+  #       python -m pytest tests/distillation/ -v --tb=short
+
+  #   - name: Run tunix RL tests
+  #     run: |
+  #       # RL common tests that passed
+  #       # b/448133814: test_grpo_with_lora_model fails
+  #       python -m pytest tests/rl/ -v --tb=short -k "not test_grpo_with_lora_model" --ignore=tests/rl/experimental/agentic
+
+  #   - name: Run tunix tests not covered by the above categories
+  #     run: |
+  #       # This category is to catch tests added but not covered by CI yet. Whenever you add new folders under tests/, please add a new category above and skip those tests here.
+  #       python -m pytest tests/ -v --tb=short --ignore=tests/perf/ --ignore=tests/model_alignment/ --ignore=tests/models/ --ignore=tests/cli/ --ignore=tests/generate/ --ignore=tests/sft/ --ignore=tests/distillation/ --ignore=tests/rl/ || code=$?
+  #       if [ "${code:-0}" = "5" ]; then
+  #         echo "No tests collected (expected)."
+  #         exit 0
+  #       else
+  #         exit "${code:-0}"
+  #       fi
 
   run_dev:
     if: ${{ github.event_name != 'pull_request' || github.event.pull_request.head.repo.full_name == github.repository }}
 
@@ -78,6 +78,26 @@
         testcase_name="gemma3-27b",
         model_name="gemma3-27b",
     ),
+    dict(
+        testcase_name="gemma-3-270m",
+        model_name="gemma-3-270m",
+    ),
+    dict(
+        testcase_name="gemma-3-1b",
+        model_name="gemma-3-1b",
+    ),
+    dict(
+        testcase_name="gemma-3-4b",
+        model_name="gemma-3-4b",
+    ),
+    dict(
+        testcase_name="gemma-3-12b",
+        model_name="gemma-3-12b",
+    ),
+    dict(
+        testcase_name="gemma-3-27b",
+        model_name="gemma-3-27b",
+    ),
     dict(
         testcase_name="llama3-70b",
         model_name="llama3-70b",
@@ -118,11 +138,10 @@
         testcase_name="qwen2.5-math-1.5b",
         model_name="qwen2.5-math-1.5b",
     ),
-    # TODO(b/451662153): support deepseek model name parsing
-    # dict(
-    #     testcase_name="deepseek-r1-distill-qwen-1.5b",
-    #     model_name="deepseek-r1-distill-qwen-1.5b",
-    # ),
+    dict(
+        testcase_name="deepseek-r1-distill-qwen-1.5b",
+        model_name="deepseek-r1-distill-qwen-1.5b",
+    ),
     dict(
         testcase_name="qwen3-0.6b",
         model_name="qwen3-0.6b",
@@ -151,10 +170,15 @@ def test_obtain_model_params_valid(self, model_name: str):
     model.obtain_model_params(model_name)
 
   def test_create_model_dynamically_routing(self, model_name: str):
-    model_module = model.get_model_module(model_name)
+    params_module = model.get_model_module(model_name, model.ModelModule.PARAMS)
     if not model_name.startswith("gemma"):
       # TODO(b/444572467)
-      getattr(model_module, "create_model_from_safe_tensors")
+      getattr(params_module, "create_model_from_safe_tensors")
+
+    model_lib_module = model.get_model_module(
+        model_name, model.ModelModule.MODEL
+    )
+    getattr(model_lib_module, "ModelConfig")
 
 
 if __name__ == "__main__":
 
@@ -345,6 +345,7 @@ def create_optimizer(
           " https://optax.readthedocs.io/en/latest/api/optimizers.html#optimizers"
       ) from e
 
+    logging.info("[SHADI] optimizer_config: %s", optimizer_config)
     # Handle learning rate, potentially creating a schedule
     learning_rate_val = self._create_learning_rate(
         optimizer_config, config_path_info