diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..6ec318b --- /dev/null +++ b/.gitignore @@ -0,0 +1,171 @@ +# Byte-compiled / optimized / DLL files +__pycache__/ +*.py[cod] +*$py.class + +# C extensions +*.so + +# Distribution / packaging +.Python +build/ +develop-eggs/ +dist/ +downloads/ +eggs/ +.eggs/ +lib/ +lib64/ +parts/ +sdist/ +var/ +wheels/ +share/python-wheels/ +*.egg-info/ +.installed.cfg +*.egg +MANIFEST + +# PyInstaller +# Usually these files are written by a python script from a template +# before PyInstaller builds the exe, so as to inject date/other infos into it. +*.manifest +*.spec + +# Installer logs +pip-log.txt +pip-delete-this-directory.txt + +# Unit test / coverage reports +htmlcov/ +.tox/ +.nox/ +.coverage +.coverage.* +.cache +nosetests.xml +coverage.xml +*.cover +*.py,cover +.hypothesis/ +.pytest_cache/ +cover/ + +# Translations +*.mo +*.pot + +# Django stuff: +*.log +local_settings.py +db.sqlite3 +db.sqlite3-journal + +# Flask stuff: +instance/ +.webassets-cache + +# Scrapy stuff: +.scrapy + +# Sphinx documentation +docs/_build/ + +# PyBuilder +.pybuilder/ +target/ + +# Jupyter Notebook +.ipynb_checkpoints + +# IPython +profile_default/ +ipython_config.py + +# pyenv +# For a library or package, you might want to ignore these files since the code is +# intended to run in multiple environments; otherwise, check them in: +# .python-version + +# pipenv +# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. +# However, in case of collaboration, if having platform-specific dependencies or dependencies +# having no cross-platform support, pipenv may install dependencies that don't work, or not +# install all needed dependencies. +#Pipfile.lock + +# poetry +# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. +# This is especially recommended for binary packages to ensure reproducibility, and is more +# commonly ignored for libraries. 
+# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control +#poetry.lock + +# pdm +# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. +#pdm.lock +# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it +# in version control. +# https://pdm.fming.dev/#use-with-ide +.pdm.toml + +# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm +__pypackages__/ + +# Celery stuff +celerybeat-schedule +celerybeat.pid + +# SageMath parsed files +*.sage.py + +# Environments +.env +.venv +env/ +venv/ +ENV/ +env.bak/ +venv.bak/ + +# Spyder project settings +.spyderproject +.spyproject + +# Rope project settings +.ropeproject + +# mkdocs documentation +/site + +# mypy +.mypy_cache/ +.dmypy.json +dmypy.json + +# Pyre type checker +.pyre/ + +# pytype static type analyzer +.pytype/ + +# Cython debug symbols +cython_debug/ + +# PyCharm +# JetBrains specific template is maintained in a separate JetBrains.gitignore that can +# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore +# and can be added to the global gitignore or merged into this file. For a more nuclear +# option (not recommended) you can uncomment the following to ignore the entire idea folder. 
+#.idea/ + +/test* +/hf_space +/.vscode +/BLINK_Benchmark +/checkpoints +/data +/*.egg-info + + +/templates/ \ No newline at end of file diff --git a/LICENSE b/LICENSE deleted file mode 100644 index 25a1149..0000000 --- a/LICENSE +++ /dev/null @@ -1,21 +0,0 @@ -MIT License - -Copyright (c) 2024 TIGER Lab - -Permission is hereby granted, free of charge, to any person obtaining a copy -of this software and associated documentation files (the "Software"), to deal -in the Software without restriction, including without limitation the rights -to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -copies of the Software, and to permit persons to whom the Software is -furnished to do so, subject to the following conditions: - -The above copyright notice and this permission notice shall be included in all -copies or substantial portions of the Software. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -SOFTWARE. 
diff --git a/README.md b/README.md deleted file mode 100644 index a6ae20e..0000000 --- a/README.md +++ /dev/null @@ -1,2 +0,0 @@ -# MantisScore -official repo for "MantisScore: A Reliable Fine-grained Metric for Video Generation" diff --git a/emnlp_pre/VideoScore_Xuan_He.pdf b/emnlp_pre/VideoScore_Xuan_He.pdf new file mode 100644 index 0000000..7beffa8 Binary files /dev/null and b/emnlp_pre/VideoScore_Xuan_He.pdf differ diff --git a/emnlp_pre/VideoScore_poster.pdf b/emnlp_pre/VideoScore_poster.pdf new file mode 100644 index 0000000..0fe5eff Binary files /dev/null and b/emnlp_pre/VideoScore_poster.pdf differ diff --git a/emnlp_pre/a.txt b/emnlp_pre/a.txt new file mode 100644 index 0000000..8b13789 --- /dev/null +++ b/emnlp_pre/a.txt @@ -0,0 +1 @@ + diff --git a/index.html b/index.html new file mode 100644 index 0000000..f109def --- /dev/null +++ b/index.html @@ -0,0 +1,1143 @@ + + + + +
+ + + + +
+ VideoScore
+ + The recent years have witnessed great advances + in video generation. However, the development + of automatic video metrics is lagging significantly behind. None of the existing metrics is + able to provide reliable scores over generated + videos. The main barrier is the lack of a large-scale human-annotated dataset. +
+ VideoFeedback Dataset.
+ In this paper, we release VideoFeedback, the first large-scale dataset
+ containing human-provided multi-aspect scores over 37.6K synthesized videos
+ from 11 existing video generative models.
+
+ VideoScore.
+ We train VideoScore (initialized from Mantis) based on VideoFeedback
+ to enable automatic video quality assessment. Experiments
+ show that the Spearman correlation between
+ VideoScore and humans can reach 77.1 on
+ VideoFeedback-test, beating the prior best
+ metrics by about 50 points. Further results on
+ other held-out EvalCrafter, GenAI-Bench, and
+ VBench show that VideoScore has consistently much higher correlation with human
+ judges than other metrics.
+
+
+ VideoFeedback Dataset + VideoFeedback contains a total of 37.6K text-to-video pairs from 11 popular video generative models, + with some real-world videos as data augmentation. + The videos are annotated by raters for five evaluation dimensions: Visual Quality (VQ), Temporal Consistency (TC), Dynamic Degree (DD), + Text-to-Video Alignment (TVA) and Factual Consistency (FC), + on a 1-4 scoring scale. Below we show the detailed description of our VideoFeedback dataset. + Please check out + 🤗 VideoFeedback + on Hugging Face datasets for usage. + +
+ +
+
+
+
+ prompt: completely base your choice of which one to visit today on the dish that most entices your taste buds, 1080P, high quality, comic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 1 | 3 | 3 |
+
+ prompt: an African American female video editor editing videos
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 1 | 3 | 3 | 1 |
+
+ prompt: Cinematic, A light rain is falling. Tea pickers are picking tea in a tea garden, 4K, anime style
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 2 | 3 | 3 | 1 |
+
+ prompt: crypto new year Christmas santa money dollars pack
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 3 | 1 |
+
+ prompt: Woman receiving a rose and blushing with a smile
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 2 |
+
+ prompt: panorama gold coast city in future as a dystopian prison
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 3 | 3 | 2 | 3 |
+
+ prompt: little bear looks surprised as the moon gets smaller
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 1 | 2 |
+
+ prompt: alexandra daddario, upperbody focus, slow motion, cinematic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 1 |
+
+ prompt: cinematic portrait of two dogs running away from a medieval man
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 2 | 1 |
+
+ prompt: a skateboard on the bottom of a surfboard, front view
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 3 | 3 | 2 |
+
+ prompt: yellow van with trailer starts to back up
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 4 | 4 | 4 | 4 |
+
+ prompt: five gray wolf pups frolicking and chasing each other around a remote gravel road, surrounded by grass. The pups run and leap, chasing each other, and nipping at each other, playing
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 2 | 4 | 2 | 4 |
+ VideoScore
+ + VideoScore is finetuned on VideoFeedback dataset's 37K training set taking + Mantis-8B-Idefics2 as base model. + We try generation scoring method and regression scoring method, + the former one means model's answer is in a template + predefined for video quality evaluation + while the latter one outputs 5 logits as evaluation scores in 5 dimensions. + + Besides, we also make ablation on base model, using + Mantis-8B-Idefics2, + Idefics2-8B + and + VideoLLaVA-7B + as base models to finetune. Mantis-8B-Idefics2 turns out to + have the best performance on video quality evaluation. +
+
+ VideoFeedback-test+ We test VideoScore on VideoFeedback-test set, containing 760 videos with human scores from five dimensions. + We take the Spearman correlation between VideoScore and human annotation as performance indicator. + Below we show the results of some feature-based metrics like PIQE, CLIP-sim, X-CLIP-Score etc, and some + MLLM-prompting methods like GPT-4o, Gemini-1.5-Pro, etc and our VideoScore. +
++ We select 3 dimensions (Visual Quality, Temporal Consistency and Text-to-Video Alignment) + from EvalCrafter that match our evaluation aspects + and collect 2500+ videos for test. + We take the Spearman correlation between VideoScore and human annotation as performance indicator. + +
+
+ GenAI-Bench is a multimodal benchmark for MLLM's capability on preference comparison
+ for tasks like text-to-video generation, image-editing and others, while
+ VBench is a comprehensive multi-aspect benchmark suite for
+ video generative models.
+ For GenAI-Bench we collect 2100+ videos in test and
+ for VBench we select a subset from 5 aspects of VBench, like technical
+ quality, subject consistency etc, then subsample 100 unique prompts for four T2V models (2000 videos totally) for test.
+ We use averaged score of our five dimensions for MLLM prompting baselines and VideoScore to
+ give the preference and calculate the pairwise accuracy as performance indicator.
+
| Metric | +Final Avg Score ↓ | +VideoFeedback-test | +EvalCrafter | +GenAI-Bench | +VBench | +
|---|---|---|---|---|---|
| VideoScore (reg) | 69.6 | 75.7 | 51.1 | 78.5 | 73.0 |
| VideoScore-(gen) | 55.6 | 77.1 | 27.6 | 59.0 | 58.7 |
| Gemini-1.5-Pro | 39.7 | 22.1 | 22.9 | 60.9 | 52.9 |
| Gemini-1.5-Flash | 39.4 | 20.8 | 17.3 | 67.1 | 52.3 |
| GPT-4o | 38.9 | 23.1 | 28.7 | 52.0 | 51.7 |
| CLIP-sim | 31.7 | 8.9 | 36.2 | 34.2 | 47.4 |
| DINO-sim | 30.3 | 7.5 | 32.1 | 38.5 | 43.3 |
| SSIM-sim | 29.5 | 13.4 | 26.9 | 34.1 | 43.5 |
| CLIP-Score | 28.6 | -7.2 | 21.7 | 45.0 | 54.9 |
| LLaVA-1.5-7B | 27.1 | 8.5 | 10.5 | 49.9 | 39.4 |
| LLaVA-1.6-7B | 23.3 | -3.1 | 13.2 | 44.5 | 38.7 |
| X-CLIP-Score | 23.2 | -1.9 | 13.3 | 41.4 | 40.1 |
| PIQE | 19.6 | -10.1 | -1.2 | 34.5 | 55.1 |
| BRISQUE | 19.0 | -20.3 | 3.9 | 38.5 | 53.7 |
| Idefics1 | 18.3 | 6.5 | 0.3 | 34.6 | 31.7 |
| MSE-dyn | 10.6 | -5.5 | -17.0 | 28.4 | 36.5 |
| SSIM-dyn | 9.2 | -12.9 | -26.4 | 31.4 | 44.5 |
+ The best VideoScore is in bold and the best in baselines is underlined. + +
+
+ VideoFeedback-test
+ Scale of all the scores is in [1, 2, 3, 4] except for VideoScore (reg),
+ which outputs five float logits ranging from 0.50 to 4.50.
+ For scale [1, 2, 3, 4], 1-Bad, 2-Avg, 3-Good, 4-Perfect/Real.
+
+
+
+ + prompt: A robot that throws a stack of paper from a desk +
+| Method | VQ | TC | DD | TVA | FC | +Method | VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|---|---|---|---|---|---|---|
| Human score | 3 | 1 | 3 | 3 | 1 | ++ | |||||
| VideoScore (reg) | 2.67 | 0.81 | 3.09 | 2.50 | 0.80 | +VideoScore (gen) | 3 | 1 | 3 | 3 | 1 | +
| GPT-4o | 3 | 4 | 2 | 3 | 4 | +Gemini-1.5-Pro | 3 | 1 | 1 | 3 | 3 | +
| Gemini-1.5-Flash | 3 | 1 | 1 | 3 | 3 | +LLaVA-1.6-7B | 3 | 3 | 3 | 3 | 3 | +
| LLaVA-1.5-7B | 3 | 3 | 3 | 3 | 2 | +Idefics1 | 4 | 4 | 3 | 1 | 2 | +
| PIQE | 1 | 1 | 1 | 1 | 1 | +DINO-sim | 1 | 1 | 1 | 1 | 1 | +
| SSIM-dyn | 3 | 3 | 3 | 3 | 3 | +CLIP-Score | 2 | 2 | 2 | 2 | 2 | +
+ + prompt: Illustrate a bustling market scene, with fresh produce displayed on stalls, attracting villagers eager to purchase, cartoon style +
+| Method | VQ | TC | DD | TVA | FC | +Method | VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|---|---|---|---|---|---|---|
| Human score | 1 | 2 | 3 | 2 | 2 | ++ | |||||
| VideoScore (reg) | 1.91 | 1.86 | 2.84 | 2.44 | 1.67 | +VideoScore (gen) | 2 | 1 | 3 | 1 | 1 | +
| GPT-4o | 3 | 3 | 3 | 4 | 4 | +Gemini-1.5-Pro | 2 | 2 | 1 | 3 | 3 | +
| Gemini-1.5-Flash | 3 | 1 | 1 | 2 | 3 | +LLaVA-1.6-7B | 3 | 3 | 3 | 3 | 3 | +
| LLaVA-1.5-7B | 3 | 3 | 3 | 2 | 2 | +Idefics1 | 4 | 4 | 3 | 1 | 2 | +
| PIQE | 2 | 2 | 2 | 2 | 2 | +DINO-sim | 4 | 4 | 4 | 4 | 4 | +
| SSIM-dyn | 2 | 2 | 2 | 2 | 2 | +CLIP-Score | 3 | 3 | 3 | 3 | 3 | +
+ + prompt: Every day must be Sunday Amusement park inside the school +
+| Method | VQ | TC | DD | TVA | FC | +Method | VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|---|---|---|---|---|---|---|
| Human score | 1 | 1 | 3 | 2 | 1 | ++ | |||||
| VideoScore (reg) | 1.04 | 1.42 | 2.95 | 1.97 | 1.09 | +VideoScore (gen) | 1 | 1 | 3 | 2 | 1 | +
| GPT-4o | 3 | 4 | 2 | 3 | 3 | +Gemini-1.5-Pro | 2 | 1 | 2 | 2 | 1 | +
| Gemini-1.5-Flash | 2 | 1 | 1 | 2 | 1 | +LLaVA-1.6-7B | 3 | 3 | 3 | 2 | 2 | +
| LLaVA-1.5-7B | 3 | 3 | 3 | 2 | 2 | +Idefics1 | 4 | 4 | 3 | 1 | 2 | +
| PIQE | 1 | 1 | 1 | 1 | 1 | +DINO-sim | 3 | 3 | 3 | 3 | 3 | +
| SSIM-dyn | 4 | 4 | 4 | 4 | 4 | +CLIP-Score | 2 | 2 | 2 | 2 | 2 | +
+ In each item we have two videos with the same prompt and a human preference annotation. + For VideoScore and MLLM prompting methods, we use the average score of all 5 dimensions to predict preference, + while for feature-based metrics, we use their discretized output for the prediction of preference directly. +
+
+
+ Left Video
+ prompt: a cute dog is playing a ball
+
+
+ Right Video
+ prompt: a cute dog is playing a ball
+
+
+
+ Left Video
+ prompt: An astronaut flying in space, oil painting
+
+
+ Right Video
+ prompt: An astronaut flying in space, oil painting
+
+ @article{he2024videoscore,
+ title = {VideoScore: Building Automatic Metrics to Simulate Fine-grained Human Feedback for Video Generation},
+ author = {He, Xuan and Jiang, Dongfu and Zhang, Ge and Ku, Max and Soni, Achint and Siu, Sherman and Chen, Haonan and Chandra, Abhranil and Jiang, Ziyan and Arulraj, Aaran and Wang, Kai and Do, Quy Duc and Ni, Yuansheng and Lyu, Bohan and Narsupalli, Yaswanth and Fan, Rongqi and Lyu, Zhiheng and Lin, Yuchen and Chen, Wenhu},
+ journal = {ArXiv},
+ year = {2024},
+ volume={abs/2406.15252},
+ url = {https://arxiv.org/abs/2406.15252},
+}
+
+
+
+ prompt: completely base your choice of which one to visit today on the dish that most entices your taste buds, 1080P, high quality, comic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 1 | 3 | 3 |
+
+ prompt: an African American female video editor editing videos
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 1 | 3 | 3 | 1 |
+
+ prompt: Cinematic, A light rain is falling. Tea pickers are picking tea in a tea garden, 4K, anime style
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 2 | 3 | 3 | 1 |
+
+ prompt: crypto new year Christmas santa money dollars pack
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 3 | 1 |
+
+ prompt: Woman receiving a rose and blushing with a smile
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 2 |
+
+ prompt: panorama gold coast city in future as a dystopian prison
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 3 | 3 | 2 | 3 |
+
+ prompt: little bear looks surprised as the moon gets smaller
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 1 | 2 |
+
+ prompt: alexandra daddario, upperbody focus, slow motion, cinematic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 1 |
+
+ prompt: cinematic portrait of two dogs running away from a medieval man
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 2 | 1 |
+
+ prompt: a skateboard on the bottom of a surfboard, front view
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 3 | 3 | 2 |
+
+ prompt: yellow van with trailer starts to back up
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 4 | 4 | 4 | 4 |
+
+ prompt: five gray wolf pups frolicking and chasing each other around a remote gravel road, surrounded by grass. The pups run and leap, chasing each other, and nipping at each other, playing
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 2 | 4 | 2 | 4 |
+ MantisScore
+
+ The recent years have witnessed great advances
+ in text-to-video generation. However, the video
+ evaluation metrics have lagged significantly behind, failing to produce an accurate and
+ holistic measure of the generated videos' quality. The main barrier is the lack of high-quality
+ human rating data.
+
+ VideoEval Dataset. In this paper, we release
+ VideoEval, the first large-scale multi-aspect
+ video evaluation dataset. VideoEval consists
+ of high-quality human-provided ratings for 5
+ video evaluation aspects on the 37.6K videos
+ generated from 11 existing popular video generative models.
+
+ MantisScore.
+ We train MantisScore based on VideoEval to enable automatic video quality assessment.
+ Experiments show that the Spearman correlation between MantisScore
+ and humans can reach 77.1 on VideoEval test, beating the prior best metrics by about
+ 50 points. Further result on the held-out Eval-Crafter, GenAI-Bench, and VBench, show that
+ MantisScore is highly generalizable and
+ still beats the prior best metrics by a remarkable margin.
+
+ VideoEval Dataset + VideoEval contains a total of 37.6K text-to-video pairs from 11 popular video generative models, + with some real-world videos as data augmentation. + The videos are annotated by raters for five evaluation dimensions: Visual Quality, Temporal Consistency, Dynamic Degree, + Text-to-Video Alignment and Factual Consistency, + in 1-4 scoring scale. Below we show the detailed description of our VideoEval dataset. + Please check out + 🤗 VideoEval + on hugging face datasets for usage. + +
+ +
+
+
+ prompt: completely base your choice of which one to visit today on the dish that most entices your taste buds, 1080P, high quality, comic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 1 | 3 | 3 |
+
+ prompt: an African American female video editor editing videos
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 1 | 3 | 3 | 1 |
+
+ prompt: Cinematic, A light rain is falling. Tea pickers are picking tea in a tea garden, 4K, anime style
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 2 | 3 | 3 | 1 |
+
+ prompt: crypto new year Christmas santa money dollars pack
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 3 | 1 |
+
+ prompt: Woman receiving a rose and blushing with a smile
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 2 |
+
+ prompt: panorama gold coast city in future as a dystopian prison
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 3 | 3 | 2 | 3 |
+
+ prompt: little bear looks surprised as the moon gets smaller
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 1 | 2 |
+
+ prompt: alexandra daddario, upperbody focus, slow motion, cinematic
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 2 | 2 | 3 | 3 | 1 |
+
+ prompt: cinematic portrait of two dogs running away from a medieval man
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 1 | 2 | 3 | 2 | 1 |
+
+ prompt: a skateboard on the bottom of a surfboard, front view
+
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 3 | 3 | 3 | 3 | 2 |
+
+ prompt: yellow van with trailer starts to back up
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 4 | 4 | 4 | 4 |
+
+ prompt: five gray wolf pups frolicking and chasing each other around a remote gravel road, surrounded by grass. The pups run and leap, chasing each other, and nipping at each other, playing
+
| VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|
| 4 | 2 | 4 | 2 | 4 |
+ MantisScore
+ + MantisScore is finetuned on VideoEval dataset's 37K training set taking + Mantis-8B-Idefics2 as base model. + We try generation scoring method and regression scoring method, + the former one means model's answer is in a template + predefined for video quality evaluation + while the latter one outputs 5 logits as evaluation scores in 5 dimensions. + + Besides, we also make ablation on base model, using + Mantis-8B-Idefics2, + Idefics2-8B + and + VideoLLaVA-7B + as base models to finetune. Mantis-8B-Idefics2 turns out to + have the best performance on video quality evaluation. +
+
+ VideoEval-test+ We test our video evaluator MantisScore on VideoEval-test set. + Here are the results of some feature-based metrics like PIQE, CLIP-sim, X-CLIP-Score etc, + MLLM-prompting methods like GPT-4o, Gemini-1.5-Pro, etc and our MantisScore. + As seen in the table below, MantisScore surpasses the best baseline by 54.1 on average on 5 aspects. +
+ We select 3 dimensions from EvalCrafter that match our evaluation aspects + and collect 2500+ videos for test. MantisScore surpasses all the baselines in 3 aspects + and EvalCrafter (GPT-4V) in Text-to-Video Alignment. +
+ GenAI-Bench is a multimodal benchmark for MLLM's capability on preference comparison + for tasks like text-to-video generation, image-editing and others, while + VBench is a comprehensive multi-aspect benchmark suite for + video generative models. For GenAI-Bench we collect 2100+ videos and + for VBench we select a subset from 5 aspects of VBench, like technical + quality, subject consistency, and so on, then subsample 100 unique prompts (2000 videos in total) for testing. + We use the averaged scores of the five aspects for MLLM prompting baselines and our models to + give the preference and calculate the pairwise accuracy as performance indicator. +
+ +| Metric | +Final Sum Score ↓ | +VideoEval-test | +EvalCrafter | +GenAI-Bench | +VBench | +
|---|---|---|---|---|---|
| MantisScore (reg) | 278.3 | 75.7 | 51.1 | 78.5 | 73.0 |
| MantisScore-(gen) | 222.4 | 77.1 | 27.6 | 59.0 | 58.7 |
| ∆ over Best Baseline | 119.5 | 54.0 | 14.9 | 11.4 | 17.9 |
| Gemini-1.5-Pro | 158.8 | 22.1 | 22.9 | 60.9 | 52.9 |
| Gemini-1.5-Flash | 157.5 | 20.8 | 17.3 | 67.1 | 52.3 |
| GPT-4o | 155.4 | 23.1 | 28.7 | 52.0 | 51.7 |
| CLIP-sim | 126.8 | 8.9 | 36.2 | 34.2 | 47.4 |
| DINO-sim | 121.3 | 7.5 | 32.1 | 38.5 | 43.3 |
| SSIM-sim | 118.0 | 13.4 | 26.9 | 34.1 | 43.5 |
| CLIP-Score | 114.4 | -7.2 | 21.7 | 45.0 | 54.9 |
| LLaVA-1.5-7B | 108.3 | 8.5 | 10.5 | 49.9 | 39.4 |
| LLaVA-1.6-7B | 93.3 | -3.1 | 13.2 | 44.5 | 38.7 |
| X-CLIP-Score | 92.9 | -1.9 | 13.3 | 41.4 | 40.1 |
| PIQE | 78.3 | -10.1 | -1.2 | 34.5 | 55.1 |
| BRISQUE | 75.9 | -20.3 | 3.9 | 38.5 | 53.7 |
| Idefics1 | 73.0 | 6.5 | 0.3 | 34.6 | 31.7 |
| MSE-dyn | 42.5 | -5.5 | -17.0 | 28.4 | 36.5 |
| SSIM-dyn | 36.7 | -12.9 | -26.4 | 31.4 | 44.5 |
| Fuyu | - | - | - | - | - |
| Kosmos-2 | - | - | - | - | - |
| CogVLM | - | - | - | - | - |
| OpenFlamingo | - | - | - | - | - |
+ The best MantisScore is in bold and the best in baselines is underlined. + "-" means the answer of MLLM is meaningless or in wrong format. +
+
+ VideoEval-test
+ Scale of all the scores is in [1, 2, 3, 4] except for MantisScore (reg),
+ which outputs five float logits ranging from 0.50 to 4.50.
+ For scale [1, 2, 3, 4], 1-Bad, 2-Avg, 3-Good, 4-Perfect/Real.
+
+
+
+ + prompt: A robot that throws a stack of paper from a desk +
+| Method | VQ | TC | DD | TVA | FC | +Method | VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|---|---|---|---|---|---|---|
| Human score | 3 | 1 | 3 | 3 | 1 | ++ | |||||
| MantisScore (reg) | 2.67 | 0.81 | 3.09 | 2.50 | 0.80 | +MantisScore (gen) | 3 | 1 | 3 | 3 | 1 | +
| GPT-4o | 3 | 4 | 2 | 3 | 4 | +Gemini-1.5-Pro | 3 | 1 | 1 | 3 | 3 | +
| Gemini-1.5-Flash | 3 | 1 | 1 | 3 | 3 | +LLaVA-1.6-7B | 3 | 3 | 3 | 3 | 3 | +
| LLaVA-1.5-7B | 3 | 3 | 3 | 3 | 2 | +Idefics1 | 4 | 4 | 3 | 1 | 2 | +
| PIQE | 1 | - | - | - | - | +DINO-sim | - | 1 | - | - | - | +
| SSIM-dyn | - | - | 3 | - | - | +CLIP-Score | - | - | - | 2 | - | +
+ + prompt: Every day must be Sunday Amusement park inside the school +
+| Method | VQ | TC | DD | TVA | FC | +Method | VQ | TC | DD | TVA | FC | +
|---|---|---|---|---|---|---|---|---|---|---|---|
| Human score | 1 | 1 | 3 | 2 | 1 | ++ | |||||
| MantisScore (reg) | 1.04 | 1.42 | 2.95 | 1.97 | 1.09 | +MantisScore (gen) | 1 | 1 | 3 | 2 | 1 | +
| GPT-4o | 3 | 4 | 2 | 3 | 3 | +Gemini-1.5-Pro | 2 | 1 | 2 | 2 | 1 | +
| Gemini-1.5-Flash | 2 | 1 | 1 | 2 | 1 | +LLaVA-1.6-7B | 3 | 3 | 3 | 2 | 2 | +
| LLaVA-1.5-7B | 3 | 3 | 3 | 2 | 2 | +Idefics1 | 4 | 4 | 3 | 1 | 2 | +
| PIQE | 1 | - | - | - | - | +DINO-sim | - | 3 | - | - | - | +
| SSIM-dyn | - | - | 4 | - | - | +CLIP-Score | - | - | - | 2 | - | +
+ In GenAI-Bench, we have two videos with the same prompt and a human preference annotation in each entry. + For MantisScore and MLLM prompting methods, we use the average score of all 5 dimensions to predict preference, + while for feature-based metrics, we use their discretized output for the prediction of preference directly. +
+
+
+ Left Video
+ prompt: a cute dog is playing a ball
+
+
+ Right Video
+ prompt: a cute dog is playing a ball
+
+
+
+ Left Video
+ prompt: An astronaut flying in space, oil painting
+
+
+ Right Video
+ prompt: An astronaut flying in space, oil painting
+
+