Implement Mamba MeanFlow x-prediction training

This commit is contained in:
Logic
2026-03-11 16:33:40 +08:00
parent 01fc1e4eab
commit 9b2968997c
5 changed files with 353 additions and 121 deletions

View File

@@ -4,7 +4,7 @@ from as_mamba import TrainConfig, run_training_and_plot
def build_parser() -> argparse.ArgumentParser:
- parser = argparse.ArgumentParser(description="Train AS-Mamba on MNIST flow matching.")
+ parser = argparse.ArgumentParser(description="Train AS-Mamba on MNIST MeanFlow x-prediction.")
parser.add_argument("--epochs", type=int, default=None)
parser.add_argument("--steps-per-epoch", type=int, default=None)
parser.add_argument("--batch-size", type=int, default=None)
@@ -15,10 +15,8 @@ def build_parser() -> argparse.ArgumentParser:
parser.add_argument("--output-dir", type=str, default=None)
parser.add_argument("--project", type=str, default=None)
parser.add_argument("--run-name", type=str, default=None)
parser.add_argument("--dt-alpha", type=float, default=None)
parser.add_argument("--dt-min", type=float, default=None)
parser.add_argument("--dt-max", type=float, default=None)
parser.add_argument("--lambda-flow", type=float, default=None)
parser.add_argument("--lambda-perceptual", type=float, default=None)
parser.add_argument("--num-classes", type=int, default=None)
parser.add_argument("--image-size", type=int, default=None)
parser.add_argument("--channels", type=int, default=None)
@@ -36,6 +34,8 @@ def build_parser() -> argparse.ArgumentParser:
parser.add_argument("--val-every", type=int, default=None)
parser.add_argument("--val-samples-per-class", type=int, default=None)
parser.add_argument("--val-grid-rows", type=int, default=None)
+ parser.add_argument("--val-sampling-steps", type=int, default=None)
+ parser.add_argument("--time-grid-size", type=int, default=None)
parser.add_argument("--use-ddp", action=argparse.BooleanOptionalAction, default=None)
return parser