
Commit e732321 ("first commit", parent 99068a9)


78 files changed, 9063 insertions(+), 0 deletions(-)

.gitignore (+9)

```
*.pyc
__pycache__/
log
log/
data
data/

submit_sbatch.sh
sbatch_gpu.sh
```

README.md (+145)
# GoMAvatar: Efficient Animatable Human Modeling from Monocular Video Using Gaussians-on-Mesh

CVPR 2024

[Paper]() | [Project Page](https://wenj.github.io/GoMAvatar/)

```bibtex
@inproceedings{wen2024gomavatar,
  title={{GoMAvatar: Efficient Animatable Human Modeling from Monocular Video Using Gaussians-on-Mesh}},
  author={Jing Wen and Xiaoming Zhao and Zhongzheng Ren and Alex Schwing and Shenlong Wang},
  booktitle={CVPR},
  year={2024}
}
```

## Requirements

Our code is tested with:
* CUDA 11.6
* PyTorch 1.13.0
* PyTorch3D 0.7.0

Install the required packages:
```Shell
conda create -n GoMAvatar
conda activate GoMAvatar

conda install pytorch==1.13.0 torchvision==0.14.0 pytorch-cuda=11.6 -c pytorch -c nvidia
pip install -r requirements.txt

# install pytorch3d
conda install -c fvcore -c iopath -c conda-forge fvcore iopath
conda install pytorch3d -c pytorch3d

# install gaussian splatting
pip install git+"https://github.com/graphdeco-inria/diff-gaussian-rasterization"
```
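To double-check the install, a quick sanity check along these lines should work (a minimal sketch, assuming the environment above is active):

```python
# Verify the key dependencies import and CUDA is visible.
import torch
import pytorch3d
import diff_gaussian_rasterization  # from the Gaussian splatting repo

print(torch.__version__)          # expect 1.13.0
print(pytorch3d.__version__)      # expect 0.7.0
print(torch.cuda.is_available())  # expect True on a CUDA 11.6 machine
```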

## Data preparation

### Prerequisites

Download SMPL v1.0.0 models from [here](https://smpl.is.tue.mpg.de/download.php) and put the `.pkl` files under `utils/smpl/models`.
You may need to remove the Chumpy objects following the instructions [here](https://github.com/vchoutas/smplx/tree/main/tools).
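To confirm the cleaned models load correctly, you can inspect one of the `.pkl` files (a minimal sketch; the exact model file name depends on your SMPL download):

```python
# Load a SMPL model pickle and list the value types; after removing the
# Chumpy objects, everything should be plain numpy arrays or scalars.
import pickle

# File name is illustrative; use whichever .pkl you placed under utils/smpl/models.
with open('utils/smpl/models/SMPL_NEUTRAL.pkl', 'rb') as f:
    params = pickle.load(f, encoding='latin1')
print({k: type(v).__name__ for k, v in params.items()})
```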

### ZJU-MoCap

First download the [ZJU-MoCap](https://github.com/zju3dv/neuralbody/blob/master/INSTALL.md#zju-mocap-dataset) dataset and save the raw data under `data/zju-mocap`.

Run the following script to preprocess the dataset:
```Shell
cd scripts/prepare_zju-mocap
python prepare_dataset.py --cfg "$SCENE".yaml
```
Change `$SCENE` to one of 377, 386, 387, 392, 393, 394.

The folder will then have the following structure:
```Shell
├── data
    ├── zju-mocap
        ├── 377
        ├── 386
        ├── ...
        ├── CoreView_377
        ├── CoreView_386
        ├── ...
```
Folders named with the scene ID alone contain the preprocessed training data, while those prefixed with `CoreView_` contain the raw data.

### PeopleSnapshot

Download the [PeopleSnapshot](https://graphics.tu-bs.de/people-snapshot) dataset and save the files under `data/snapshot`.

Download the refined training poses from [here](https://github.com/tijiang13/InstantAvatar/tree/master/data/PeopleSnapshot).

Run the following scripts to preprocess the training and test sets:
```Shell
cd scripts/prepare_snapshot
python prepare_dataset.py --cfg "$SCENE".yaml # training set
python prepare_dataset.py --cfg "$SCENE"_test.yaml # test set
```
`$SCENE` is one of `female-3-casual`, `female-4-casual`, `male-3-casual` and `male-4-casual`.

After preprocessing, the folder will have the following structure:
```Shell
├── data
    ├── snapshot
        ├── f3c_train
        ├── f3c_test
        ├── f4c_train
        ├── f4c_test
        ├── ...
        ├── female-3-casual
        ├── female-4-casual
        ├── ...
        ├── poses # refined training poses
            ├── female-3-casual
                ├── poses
                    ├── anim_nerf_test.npz
                    ├── anim_nerf_train.npz
                    ├── anim_nerf_val.npz
            ├── ...
```
Folders ending with `_train` or `_test` contain the preprocessed data.

## Rendering and evaluation

We provide pretrained checkpoints at this [link](https://uofi.box.com/s/onwfp29ej03sr2ci7mm59nu74v6i0ip3). To reproduce the rendering results in the paper, run:
```Shell
# ZJU-MoCap novel view synthesis
python eval.py --cfg exps/zju-mocap_"$SCENE".yaml --type view

# ZJU-MoCap novel pose synthesis
python eval.py --cfg exps/zju-mocap_"$SCENE".yaml --type pose
```
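To sweep every scene and both evaluation types in one go, a small driver script along these lines may help (a sketch; `eval.py`, the config naming, and the scene IDs come from this README, everything else is illustrative):

```python
# Evaluate novel view and novel pose synthesis for every ZJU-MoCap scene.
import subprocess

for scene in ['377', '386', '387', '392', '393', '394']:
    for split in ['view', 'pose']:
        subprocess.run(
            ['python', 'eval.py',
             '--cfg', f'exps/zju-mocap_{scene}.yaml',
             '--type', split],
            check=True)  # stop on the first failing run
```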
On the PeopleSnapshot dataset, we follow [Anim-NeRF](https://github.com/JanaldoChen/Anim-NeRF) and [InstantAvatar](https://github.com/tijiang13/InstantAvatar) and refine the test poses first:
```Shell
python train_pose.py --cfg exps/snapshot_"$SCENE".yaml
```
Please check `exps/` for the detailed configuration files.

You can run 360-degree free-view rendering using the following command:
```Shell
python eval.py --cfg exps/zju-mocap_"$SCENE".yaml --type freeview
```
Use `--frame_idx` to specify the training frame ID and `--n_frames` to set the number of views.

You can also render novel poses from [MDM](https://guytevet.github.io/mdm-page/):
```Shell
python eval.py --cfg exps/zju-mocap_"$SCENE".yaml --type pose_mdm --pose_path data/pose_mdm/sample.npy
```
We provide an example pose trajectory in `data/pose_mdm/sample.npy`.

## Training

Run the following command to train from scratch:
```Shell
# ZJU-MoCap
python train.py --cfg exps/zju-mocap_"$SCENE".yaml

# PeopleSnapshot
python train.py --cfg exps/snapshot_"$SCENE".yaml
```

## Acknowledgements

This project builds upon [HumanNeRF](https://github.com/chungyiweng/humannerf) and [MonoHuman](https://github.com/Yzmblog/MonoHuman/tree/main). We thank the authors for their great work!

configs/__init__.py (+21)

```python
import os

from .yacs import CfgNode as CN


# pylint: disable=redefined-outer-name


def make_cfg(cfg_filename):
    # Start from the repository-wide defaults, then overlay the experiment file.
    cfg = CN()
    cfg.merge_from_file('configs/default.yaml')
    if cfg_filename is not None:
        cfg.merge_from_file(cfg_filename)

    # Save under log/<exp_name> unless the config specifies save_dir.
    log_root = 'log' if not hasattr(cfg, 'save_dir') else cfg.save_dir
    cfg.save_dir = os.path.join(log_root, cfg.exp_name)

    return cfg
```
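A minimal usage sketch (the experiment file name follows the `exps/` convention in the README and is illustrative):

```python
from configs import make_cfg

# Merge configs/default.yaml with an experiment file, then read the result.
cfg = make_cfg('exps/zju-mocap_377.yaml')
print(cfg.exp_name)  # experiment name from the YAML
print(cfg.save_dir)  # typically log/<exp_name> unless save_dir is overridden
```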

configs/default.yaml (+131)

```yaml
exp_name: "default"

bgcolor: [255., 255., 255.]
random_bgcolor: true
img_size: [512, 512]

dataset:
  train:
    dataset_path: "dataset/zju_mocap/387"
    batch_size: 1
    num_workers: 1

    skip: 1
    maxframes: -1
    split_for_pose: false # if true, leave 1/5 frames for novel pose evaluation (monohuman's split)

    crop_size: [-1, -1]
    prefetch: false

  test_view:
    name: "zju-mocap"
    dataset_path: "dataset/zju_mocap/387"
    raw_dataset_path: "dataset/zju_mocap/CoreView_387"
    batch_size: 1
    num_workers: 1

    skip: 1
    maxframes: -1

    exclude_view: 0

  test_pose:
    dataset_path: "dataset/zju_mocap/387"
    raw_dataset_path: "dataset/zju_mocap/CoreView_387"
    batch_size: 1
    num_workers: 1

  test_pose_mdm:
    dataset_path: "dataset/zju_mocap/387"
    pose_path: "data/pose_mdm/row00_col00_smpl_params.npy"
    batch_size: 1
    num_workers: 1
    format: 'mdm'

  test_on_train:
    batch_size: 1
    num_workers: 1

  test_freeview:
    dataset_path: "dataset/zju_mocap/387"
    batch_size: 1
    num_workers: 1
    src_type: 'zju_mocap'

model:
  # basic info, override all modules
  img_size: [512, 512]
  subdivide_iters: []
  eval_mode: false

  appearance:
    face_color: true
    color_init: 0.5

  canonical_geometry:
    radius_scale: 1.0
    deform_scale: false
    deform_so3: false

    sigma: 0.001

  lbs_weights:
    refine: false

  renderer:
    name: 'gaussian'

  pose_refinement:
    name: 'none'

  non_rigid:
    name: 'none'

  normal_renderer:
    name: 'none'

  shadow_module:
    name: 'none'

train:
  optim: 'adam'
  lr:
    lbs_weights: 0.0
    appearance: 0.005
    canonical_geometry: 0.005
    canonical_geometry_xyz: 0.005
    non_rigid: 0.005
    pose_refinement: 0.0005
    shadow: 0.005

  losses:
    rgb:
      coeff: 1.0

    mask:
      coeff: 5.0

    lpips:
      coeff: 1.0

    laplacian:
      coeff_canonical: 0.0
      coeff_observation: 0.0

    normal:
      coeff_consist: 0.0

      mask_dilate: false
      coeff_mask: 0.0

    color_consist:
      coeff: 0.0

  total_iters: 30000
  lr_update_exp: true
  lr_decay_steps: 100000

  log_freq: 10
  tb_freq: 100
  save_freq: 1000
  eval_freq: 50000
```
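For orientation, this sketch mimics the merge that `make_cfg` in `configs/__init__.py` performs, using the pip-installed `yacs` in place of the repository's vendored `configs/yacs.py` (an assumption; the vendored copy may behave slightly differently, and the experiment file name is illustrative):

```python
# Layer an experiment config over the defaults shown above.
from yacs.config import CfgNode as CN

cfg = CN(new_allowed=True)                      # let the first merge create keys
cfg.merge_from_file('configs/default.yaml')     # the defaults listed above
cfg.merge_from_file('exps/zju-mocap_377.yaml')  # experiment values override
print(cfg.exp_name, cfg.train.total_iters)
```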
