
[Flux] load AutoencoderKL from diffusers #1085


Open · wants to merge 3 commits into main

6 changes: 6 additions & 0 deletions torchtitan/experiments/flux/README.md
@@ -2,6 +2,12 @@

## Overview

## Install dependencies

```bash
pip install -U -r requirements.txt
```

## Usage
First, download the autoencoder model from HuggingFace with your own access token:
```bash
# … (rest of the download command collapsed in the diff)
```
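The download command itself is collapsed in this diff view. As a rough sketch of what it amounts to (the repo id, filename, and token handling below are assumptions for illustration, not necessarily the script this PR ships), the autoencoder weights can be fetched with `huggingface_hub`:

```python
# Illustrative sketch only: repo id, filename, and token handling are assumptions.
from huggingface_hub import hf_hub_download

ae_path = hf_hub_download(
    repo_id="black-forest-labs/FLUX.1-dev",  # gated repo; requires accepting the license
    filename="ae.safetensors",               # standalone Flux autoencoder weights
    token="<your_access_token>",
)
print(f"autoencoder weights saved to {ae_path}")
```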
34 changes: 0 additions & 34 deletions torchtitan/experiments/flux/__init__.py
@@ -10,7 +10,6 @@
from torchtitan.components.optimizer import build_optimizers
from torchtitan.experiments.flux.dataset.flux_dataset import build_flux_dataloader
from torchtitan.experiments.flux.loss import build_mse_loss
from torchtitan.experiments.flux.model.autoencoder import AutoEncoderParams
from torchtitan.experiments.flux.parallelize_flux import parallelize_flux
from torchtitan.protocols.train_spec import register_train_spec, TrainSpec

@@ -39,17 +38,6 @@
theta=10_000,
qkv_bias=True,
guidance_embed=True,
autoencoder_params=AutoEncoderParams(
resolution=256,
in_channels=3,
ch=128,
out_ch=3,
ch_mult=(1, 2, 4, 4),
num_res_blocks=2,
z_channels=16,
scale_factor=0.3611,
shift_factor=0.1159,
),
),
"flux-schnell": FluxModelArgs(
in_channels=64,
@@ -65,17 +53,6 @@
theta=10_000,
qkv_bias=True,
guidance_embed=False,
Contributor:

Should also remove the line `from torchtitan.experiments.flux.model.autoencoder import AutoEncoderParams` at the beginning of this file.

autoencoder_params=AutoEncoderParams(
resolution=256,
in_channels=3,
ch=128,
out_ch=3,
ch_mult=(1, 2, 4, 4),
num_res_blocks=2,
z_channels=16,
scale_factor=0.3611,
shift_factor=0.1159,
),
),
"flux-debug": FluxModelArgs(
in_channels=64,
@@ -91,17 +68,6 @@
theta=10_000,
qkv_bias=True,
guidance_embed=True,
autoencoder_params=AutoEncoderParams(
resolution=256,
in_channels=3,
ch=128,
out_ch=3,
ch_mult=(1, 2, 4, 4),
num_res_blocks=2,
z_channels=16,
scale_factor=0.3611,
shift_factor=0.1159,
),
),
}
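
With these blocks gone, the autoencoder hyperparameters are no longer duplicated inside `FluxModelArgs`; per the PR title, the VAE is instead loaded as a diffusers `AutoencoderKL`, whose config already carries `scaling_factor`/`shift_factor` (0.3611 / 0.1159 for Flux, matching the values deleted above). A minimal sketch of that pattern, with the repo id and the encode helper being illustrative assumptions rather than the PR's actual code path:

```python
import torch
from diffusers import AutoencoderKL

# Sketch: build the Flux VAE from diffusers instead of a hand-maintained
# AutoEncoderParams dataclass (repo id and dtype are assumptions).
vae = AutoencoderKL.from_pretrained(
    "black-forest-labs/FLUX.1-dev", subfolder="vae", torch_dtype=torch.bfloat16
)

@torch.no_grad()
def encode_to_latents(images: torch.Tensor) -> torch.Tensor:
    """Encode (B, 3, H, W) images in [-1, 1] into scaled/shifted latents."""
    latents = vae.encode(images).latent_dist.sample()
    # scale/shift now come from the diffusers config rather than FluxModelArgs
    return (latents - vae.config.shift_factor) * vae.config.scaling_factor
```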
