
Commit 363b50d: Open-source data processing code
1 parent 9924ce0

22 files changed, +1868 -1 lines changed

.gitignore

Lines changed: 167 additions & 0 deletions
@@ -0,0 +1,167 @@
# dataset
/b2d_dynamic_camera
/b2d_fixed_camera
/log

# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
*$py.class

# C extensions
*.so

# Distribution / packaging
.Python
build/
develop-eggs/
dist/
downloads/
eggs/
.eggs/
lib/
lib64/
parts/
sdist/
var/
wheels/
share/python-wheels/
*.egg-info/
.installed.cfg
*.egg
MANIFEST

# Environments
.env
.venv
env/
venv/
ENV/
env.bak/
venv.bak/

# PyInstaller
# Usually these files are written by a python script from a template
# before PyInstaller builds the exe, so as to inject date/other infos into it.
*.manifest
*.spec

# Installer logs
pip-log.txt
pip-delete-this-directory.txt

# Unit test / coverage reports
htmlcov/
.tox/
.nox/
.coverage
.coverage.*
.cache
nosetests.xml
coverage.xml
*.cover
*.py,cover
.hypothesis/
.pytest_cache/
cover/

# Translations
*.mo
*.pot

# Django stuff:
*.log
local_settings.py
db.sqlite3
db.sqlite3-journal

# Flask stuff:
instance/
.webassets-cache

# Scrapy stuff:
.scrapy

# Sphinx documentation
docs/_build/

# PyBuilder
.pybuilder/
target/

# Jupyter Notebook
.ipynb_checkpoints

# IPython
profile_default/
ipython_config.py

# pyenv
# For a library or package, you might want to ignore these files since the code is
# intended to run in multiple environments; otherwise, check them in:
# .python-version

# pipenv
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
# However, in case of collaboration, if having platform-specific dependencies or dependencies
# having no cross-platform support, pipenv may install dependencies that don't work, or not
# install all needed dependencies.
#Pipfile.lock

# poetry
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
# This is especially recommended for binary packages to ensure reproducibility, and is more
# commonly ignored for libraries.
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
#poetry.lock

# pdm
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
#pdm.lock
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
# in version control.
# https://pdm.fming.dev/latest/usage/project/#working-with-version-control
.pdm.toml
.pdm-python
.pdm-build/

# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
__pypackages__/

# Celery stuff
celerybeat-schedule
celerybeat.pid

# SageMath parsed files
*.sage.py

# Spyder project settings
.spyderproject
.spyproject

# Rope project settings
.ropeproject

# mkdocs documentation
/site

# mypy
.mypy_cache/
.dmypy.json
dmypy.json

# Pyre type checker
.pyre/

# pytype static type analyzer
.pytype/

# Cython debug symbols
cython_debug/

# PyCharm
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
# and can be added to the global gitignore or merged into this file. For a more nuclear
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
#.idea/

README.md

Lines changed: 23 additions & 1 deletion
@@ -4,10 +4,32 @@
</div>


-We are cleaning and organizing the code, and will open source all the training and inference code. Thanks for your patience.
+We are currently cleaning and organizing the code; the data preprocessing part is now publicly available. Thank you for your patience while we prepare the training and inference code.

[Project Page](https://thinklab-sjtu.github.io/DriveMoE/), [Paper](https://arxiv.org/abs/2505.16278)

+
+## Installation
+Before you begin, make sure your CUDA version is greater than 12.1.
+
+Clone this repository to your working directory and run `pip install -e .` to install the dependencies.
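For reference, the clone-and-install step looks roughly as follows; the repository URL is an assumption based on the project page and may differ:

```console
# Assumed repository URL; adjust if the actual remote differs.
git clone https://github.com/Thinklab-SJTU/DriveMoE.git
cd DriveMoE
pip install -e .
```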
+
+Download the PaliGemma weights to your directory:
+```console
+git clone https://huggingface.co/google/paligemma-3b-pt-224
+```
+
+If you want to train DrivePi0 and DriveMoE with this code, or to run open-loop testing with the provided checkpoints, you will need the Bench2Drive dataset and our camera labels. You can download them from https://huggingface.co/datasets/rethinklab/Bench2Drive and https://huggingface.co/rethinklab/DriveMoE.
+
+Set the environment variables `DATA_DIR` (if you download the dataset for training), `CAMERA_LABEL_DIR`, `LOG_DIR`, and `WANDB_ENTITY` by running `source script/set_path.sh`.
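If you prefer a non-interactive setup, the same variables can also be exported by hand. A minimal sketch using the default paths from `script/set_path.sh` (adjust the placeholders to your setup):

```console
# Mirrors the defaults in script/set_path.sh (the script additionally persists
# DATA_DIR, CAMERA_LABEL_DIR and LOG_DIR to ~/.bashrc).
export DATA_DIR="${PWD}/Bench2Drive-Base"
export CAMERA_LABEL_DIR="${PWD}/camera_labels"
export LOG_DIR="${PWD}/log"
export PYTHONPATH="${PWD}"
export WANDB_ENTITY="your-wandb-entity"   # placeholder; if unset, pass wandb=null when running scripts
```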
+
+## Data processing
+Run these two scripts to preprocess the training data:
+```console
+sh script/generate_data.sh && sh script/window.sh
+```
+We provide dataset statistics for normalizing the data during training. You can also run `sh script/get_statistics.sh` to regenerate them.
+

## Citation <a name="citation"></a>

```bibtex
Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
current_dir: "YOUR_CURRENT_WORK_DIR" # You need to set path

data:
  val:
    statistics_path: ${current_dir}/statistics.json
    use_fixed_images: False
    work_dir: ${current_dir}
    split: val
    num_of_action_experts: 6
    shuffle_buffer_size: 200000
Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
current_dir: "YOUR_CURRENT_WORK_DIR" # You need to set path

data:
  train:
    statistics_path: ${current_dir}/statistics.json
    use_fixed_images: False
    work_dir: ${current_dir}
    split: train
    num_of_action_experts: 13
    shuffle_buffer_size: 200000
Lines changed: 10 additions & 0 deletions
@@ -0,0 +1,10 @@
current_dir: "YOUR_CURRENT_WORK_DIR" # You need to set path

data:
  train:
    statistics_path: ${current_dir}/statistics.json
    use_fixed_images: True
    work_dir: ${current_dir}
    split: None
    num_of_action_experts: 44
    shuffle_buffer_size: 200000
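The `${current_dir}` placeholders in these configs use OmegaConf interpolation syntax (omegaconf and hydra-core are listed as dependencies in pyproject.toml below). As an illustration only, here is a sketch of loading one of the training configs; the file name `config/train_dynamic.yaml` is hypothetical, since the commit view does not show the config file paths:

```python
from omegaconf import OmegaConf

# Hypothetical file name: the commit does not show where these configs live.
cfg = OmegaConf.load("config/train_dynamic.yaml")

# Replace the "YOUR_CURRENT_WORK_DIR" placeholder before resolving interpolations.
cfg.current_dir = "/path/to/your/work_dir"

# ${current_dir} interpolations resolve on access.
print(cfg.data.train.statistics_path)        # /path/to/your/work_dir/statistics.json
print(cfg.data.train.num_of_action_experts)  # e.g. 13 for the second config shown above
```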

pyproject.toml

Lines changed: 50 additions & 0 deletions
@@ -0,0 +1,50 @@
[project]
name = "DriveMoE"
version = "0.1.0"
description = "Open source codes for Drive-pi0 and DriveMoE"
readme = "README.md"
requires-python = "==3.10.*"
classifiers = [
    "Programming Language :: Python :: 3",
]
dependencies = [
    "opencv-python",
    "joblib",
    "bitsandbytes",
    "einops",
    "gsutil>=5.32",
    "hydra-core",
    "imageio",
    "matplotlib",
    "numpy==1.26.4",
    "omegaconf",
    "pillow",
    "pre-commit>=4.0.1",
    "pretty_errors",
    "protobuf==3.20.3",
    "tensorflow==2.15.0",
    "tensorflow_datasets==4.9.2",
    "torch==2.5.0",
    "torchvision==0.20.0",
    "transformers",
    "tqdm",
    "wandb",
]

[build-system]
requires = ["setuptools>=61.0"]
build-backend = "setuptools.build_meta"

[tool.setuptools.packages.find]
exclude = []

[tool.ruff]
line-length = 88
target-version = "py310"

[tool.ruff.lint]
select = ["A", "B", "E", "F", "I", "RUF", "W"]
ignore = ["E203", "E501", "B006", "B026", "B905"]

[tool.ruff.lint.per-file-ignores]
"__init__.py" = ["E402", "F401", "F403"]

script/generate_data.sh

Lines changed: 7 additions & 0 deletions
@@ -0,0 +1,7 @@
#!/bin/bash

DATASET_PATH="$DATA_DIR"
WORK_DIR="${PWD}"
CAM_ID_PATH="$CAMERA_LABEL_DIR"

python "src/data_processing/generate_data.py" --dataset_path "$DATASET_PATH" --cam_id_path "$CAM_ID_PATH" --work_dir "$WORK_DIR"

script/get_statistics.sh

Lines changed: 5 additions & 0 deletions
@@ -0,0 +1,5 @@
#!/bin/bash

DATA_PATH="${PWD}/b2d_dynamic_camera/train"

python "src/data_processing/get_statistics.py" --data_path "$DATA_PATH"

script/set_path.sh

Lines changed: 59 additions & 0 deletions
@@ -0,0 +1,59 @@
#!/bin/bash

##################### Paths #####################

# Set default paths
DEFAULT_DATA_DIR="${PWD}/Bench2Drive-Base"
DEFAULT_LOG_DIR="${PWD}/log"
DEFAULT_CAMERA_LABEL_DIR="${PWD}/camera_labels"
PYTHONPATH="${PWD}"

# Prompt the user for input, allowing overrides
read -p "Enter the desired Bench2Drive Dataset directory [default: ${DEFAULT_DATA_DIR}], leave empty to use default: " DATA_DIR
DATA_DIR=${DATA_DIR:-$DEFAULT_DATA_DIR} # Use user input or default if input is empty

read -p "Enter the desired camera labels directory [default: ${DEFAULT_CAMERA_LABEL_DIR}], leave empty to use default: " CAMERA_LABEL_DIR
CAMERA_LABEL_DIR=${CAMERA_LABEL_DIR:-$DEFAULT_CAMERA_LABEL_DIR} # Use user input or default if input is empty

read -p "Enter the desired logging directory [default: ${DEFAULT_LOG_DIR}], leave empty to use default: " LOG_DIR
LOG_DIR=${LOG_DIR:-$DEFAULT_LOG_DIR} # Use user input or default if input is empty

# Export to current session
export DATA_DIR="$DATA_DIR"
export LOG_DIR="$LOG_DIR"
export CAMERA_LABEL_DIR="$CAMERA_LABEL_DIR"
export PYTHONPATH="$PYTHONPATH"

# Confirm the paths with the user
echo "Data directory set to: $DATA_DIR"
echo "Camera label directory set to: $CAMERA_LABEL_DIR"
echo "Log directory set to: $LOG_DIR"

# Append environment variables to .bashrc
echo "export DATA_DIR=\"$DATA_DIR\"" >> ~/.bashrc
echo "export CAMERA_LABEL_DIR=\"$CAMERA_LABEL_DIR\"" >> ~/.bashrc
echo "export LOG_DIR=\"$LOG_DIR\"" >> ~/.bashrc

echo "Environment variables DATA_DIR, CAMERA_LABEL_DIR and LOG_DIR added to .bashrc and applied to the current session."

##################### WandB #####################

# Prompt the user for input, allowing overrides
read -p "Enter your WandB entity (username or team name), leave empty to skip: " ENTITY

# Check if ENTITY is not empty
if [ -n "$ENTITY" ]; then
    # If ENTITY is not empty, set the environment variable
    export WANDB_ENTITY="$ENTITY"

    # Confirm the entity with the user
    echo "WandB entity set to: $WANDB_ENTITY"

    # Append environment variable to .bashrc
    echo "export WANDB_ENTITY=\"$ENTITY\"" >> ~/.bashrc

    echo "Environment variable WANDB_ENTITY added to .bashrc and applied to the current session."
else
    # If ENTITY is empty, skip setting the environment variable
    echo "No WandB entity provided. Please set wandb=null when running scripts to disable wandb logging and avoid error."
fi

script/window.sh

Lines changed: 7 additions & 0 deletions
@@ -0,0 +1,7 @@
#!/bin/bash

WORK_DIR="${PWD}"
WINDOW_SIZE=5
HORIZON=10

python "src/data_processing/window.py" --work_dir "$WORK_DIR" --window_size "$WINDOW_SIZE" --horizon "$HORIZON"
