Commit 1bde1c1

Update visualization tools for T2M

1 parent: 8aa226e
File tree

15 files changed: +1258 -5 lines

README.md (4 additions, 4 deletions)

@@ -52,6 +52,10 @@ This repository contains the official implementation of _MotionDiffuse: Text-Dri
 
 [10/2022] Code release for text-driven motion generation!
 
+## Text-driven Motion Generation
+
+You may refer to [readme](text2motion/README.md) for detailed introduction.
+
 ## Citation
 
 If you find our work useful for your research, please consider citing the paper:
@@ -65,10 +69,6 @@ If you find our work useful for your research, please consider citing the paper:
 }
 ```
 
-## Text-driven Motion Generation
-
-You may refer to [readme](text2motion/README.md) for detailed introduction.
-
 ## Acknowledgements
 
 This study is supported by NTU NAP, MOE AcRF Tier 2 (T2EP20221-0033), and under the RIE2020 Industry Alignment Fund – Industry Collaboration Projects (IAF-ICP) Funding Initiative, as well as cash and in-kind contribution from the industry partner(s).

figures/gallery_t2m/gen_00.gif (530 KB)
figures/gallery_t2m/gen_01.gif (844 KB)
figures/gallery_t2m/gen_02.gif (578 KB)
figures/gallery_t2m/gen_03.gif (310 KB)
figures/gallery_t2m/gen_04.gif (714 KB)
figures/gallery_t2m/gen_05.gif (371 KB)
figures/gallery_t2m/gen_06.gif (537 KB)
figures/gallery_t2m/gen_07.gif (612 KB)

text2motion/README.md (36 additions, 0 deletions)

@@ -49,6 +49,42 @@ python -u tools/evaluation.py checkpoints/kit/kit_motiondiffuse/opt.txt GPU_ID
 python -u tools/evaluation.py checkpoints/kit/kit_motiondiffuse/opt.txt
 ```
 
+## Visualization
+
+You can visualize generated human motion from a given language description and an expected motion length.
+
+```shell
+# Currently we only support visualization of models trained on the HumanML3D dataset.
+# Motion length cannot be larger than 196, which is the maximum length used during training.
+# You can omit `--gpu_id` to run the visualization on your CPU.
+
+python -u tools/visualization.py \
+    --opt_path checkpoints/t2m/t2m_motiondiffuse/opt.txt \
+    --text "a person is jumping" \
+    --motion_length 60 \
+    --result_path "test_sample.gif" \
+    --gpu_id 0
+```
+
+Here are some visualization examples. The motion length is shown in the title of each animation.
+
+<table>
+<tr>
+    <td><img src="../figures/gallery_t2m/gen_00.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_01.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_02.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_03.gif" width="100%"/></td>
+</tr>
+<tr>
+    <td><img src="../figures/gallery_t2m/gen_04.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_05.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_06.gif" width="100%"/></td>
+    <td><img src="../figures/gallery_t2m/gen_07.gif" width="100%"/></td>
+</tr>
+</table>
+
+**Note:** You may need to install `matplotlib==3.3.1` for the visualization to work.
+
 ## Acknowledgement
 
 This code is developed on top of [Generating Diverse and Natural 3D Human Motions from Text](https://github.com/EricGuo5513/text-to-motion)
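
The flags documented in the section above also lend themselves to scripted use. Below is a small helper sketch, not part of this commit, that renders several prompts by invoking `tools/visualization.py` with the same arguments; the prompt list and output file names are illustrative.

```python
# Render multiple prompts by calling tools/visualization.py repeatedly.
# Run this from the text2motion/ directory, like the command documented above.
import subprocess

PROMPTS = [
    ("a person is jumping", 60),
    ("a person walks forward slowly", 120),
]

for i, (text, length) in enumerate(PROMPTS):
    subprocess.run([
        "python", "-u", "tools/visualization.py",
        "--opt_path", "checkpoints/t2m/t2m_motiondiffuse/opt.txt",
        "--text", text,
        "--motion_length", str(length),
        "--result_path", f"sample_{i:02d}.gif",
    ], check=True)
```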

text2motion/requirements.txt (1 addition, 1 deletion)

@@ -2,6 +2,6 @@ tqdm
 opencv-python
 clip
 scipy
-matplotlib
+matplotlib==3.3.1
 spacy
 git+https://github.com/openai/CLIP.git
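
Since the dependency is now pinned, a quick sanity check can catch a mismatched install before running the visualization. The snippet below is only an illustrative sketch, not part of the repository.

```python
# Optional check: warn if the installed matplotlib does not match the pinned version,
# since the note in text2motion/README.md asks for 3.3.1.
import matplotlib

if matplotlib.__version__ != "3.3.1":
    print(f"Warning: expected matplotlib 3.3.1, found {matplotlib.__version__}")
```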

text2motion/tools/visualization.py (new file, 80 additions)

@@ -0,0 +1,80 @@

import os
import torch
import argparse
from os.path import join as pjoin

import utils.paramUtil as paramUtil
from torch.utils.data import DataLoader
from utils.plot_script import *
from utils.get_opt import get_opt
from datasets.evaluator_models import MotionLenEstimatorBiGRU

from trainers import DDPMTrainer
from models import MotionTransformer
from utils.word_vectorizer import WordVectorizer, POS_enumerator
from utils.utils import *
from utils.motion_process import recover_from_ric


def plot_t2m(data, result_path, caption):
    # Recover 3D joint positions from the RIC features and render them as an animation.
    joint = recover_from_ric(torch.from_numpy(data).float(), opt.joints_num).numpy()
    # joint = motion_temporal_filter(joint, sigma=1)
    plot_3d_motion(result_path, paramUtil.t2m_kinematic_chain, joint, title=caption, fps=20)


def build_models(opt):
    encoder = MotionTransformer(
        input_feats=opt.dim_pose,
        num_frames=opt.max_motion_length,
        num_layers=opt.num_layers,
        latent_dim=opt.latent_dim,
        no_clip=opt.no_clip,
        no_eff=opt.no_eff)
    return encoder


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('--opt_path', type=str, help='Opt path')
    parser.add_argument('--text', type=str, default="", help='Text description for motion generation')
    parser.add_argument('--motion_length', type=int, default=60, help='Number of frames for motion generation')
    parser.add_argument('--result_path', type=str, default="test_sample.gif", help='Path to save generation result')
    parser.add_argument('--gpu_id', type=int, default=-1, help="which gpu to use")
    args = parser.parse_args()

    # Use the requested GPU if one is given, otherwise fall back to the CPU.
    device = torch.device('cuda:%d' % args.gpu_id if args.gpu_id != -1 else 'cpu')
    opt = get_opt(args.opt_path, device)
    opt.do_denoise = True

    # Only checkpoints trained on HumanML3D (t2m) are supported, and the requested
    # length may not exceed the maximum length seen during training.
    assert opt.dataset_name == "t2m"
    assert args.motion_length <= 196
    opt.data_root = './dataset/HumanML3D'
    opt.motion_dir = pjoin(opt.data_root, 'new_joint_vecs')
    opt.text_dir = pjoin(opt.data_root, 'texts')
    opt.joints_num = 22
    opt.dim_pose = 263
    dim_word = 300
    dim_pos_ohot = len(POS_enumerator)
    num_classes = 200 // opt.unit_length

    # Statistics used to de-normalize the generated motion features.
    mean = np.load(pjoin(opt.meta_dir, 'mean.npy'))
    std = np.load(pjoin(opt.meta_dir, 'std.npy'))

    w_vectorizer = WordVectorizer('./data/glove', 'our_vab')
    encoder = build_models(opt).to(device)  # keep the model on `device` so CPU-only runs also work
    trainer = DDPMTrainer(opt, encoder)
    trainer.load(pjoin(opt.model_dir, opt.which_epoch + '.tar'))

    trainer.eval_mode()
    trainer.to(opt.device)

    result_dict = {}
    with torch.no_grad():
        if args.motion_length != -1:
            # Generate a motion for the prompt, map it back to the original feature scale,
            # and render it to `--result_path`.
            caption = [args.text]
            m_lens = torch.LongTensor([args.motion_length]).to(device)
            pred_motions = trainer.generate(caption, m_lens, opt.dim_pose)
            motion = pred_motions[0].cpu().numpy()
            motion = motion * std + mean
            title = args.text + " #%d" % motion.shape[0]
            plot_t2m(motion, args.result_path, title)
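
If the raw joint positions are needed in addition to the rendered GIF, the same `recover_from_ric` call used by `plot_t2m` can export them. The sketch below is an illustration, not part of the commit; it assumes the variables `motion`, `opt`, and `args` from the script above are still in scope.

```python
# Save the recovered (T, joints_num, 3) joint positions next to the GIF.
import numpy as np
import torch
from utils.motion_process import recover_from_ric

joints = recover_from_ric(torch.from_numpy(motion).float(), opt.joints_num).numpy()
np.save(args.result_path.replace(".gif", ".npy"), joints)  # e.g. test_sample.npy
print("Saved joint positions with shape", joints.shape)
```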
