<!--
anycoder-paper / index.html
SmartFlow's picture
Upload index.html with huggingface_hub
c1db41d verified
-->
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>JarvisArt: Tech Poster</title>
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
<style>
/* Design tokens: custom properties consumed through var() by the rules below. */
:root {
  /* Page surface and default foreground. */
  --dark: #1a1a2e;
  --light: #f8f9fa;
  --text: #333;
  /* Header gradient endpoints and the blue accent used for headings/highlights. */
  --primary: #6e48aa;
  --secondary: #9d50bb;
  --accent: #4776e6;
}

/* Global reset: zero spacing, border-box sizing and one font stack for every element. */
* {
  box-sizing: border-box;
  margin: 0;
  padding: 0;
  font-family: "Segoe UI", Tahoma, Geneva, Verdana, sans-serif;
}

/* Page defaults: light text on the dark surface. */
body {
  line-height: 1.6;
  color: var(--light);
  background-color: var(--dark);
}
/* Poster card: centred, capped at 1200px, rounded and clipped to its own box. */
.poster {
  position: relative; /* containing block for the ::before glow layer */
  max-width: 1200px;
  margin: 2rem auto;
  overflow: hidden;
  border: 1px solid rgba(255, 255, 255, .1);
  border-radius: 15px;
  background: linear-gradient(135deg, #1a1a2e, #16213e);
  box-shadow: 0 20px 40px rgba(0, 0, 0, .3);
}

/* Decorative overlay covering the whole card: two faint purple radial glows. */
.poster::before {
  content: "";
  position: absolute;
  top: 0;
  left: 0;
  width: 100%;
  height: 100%;
  /* The overlay must never intercept clicks meant for the content. */
  pointer-events: none;
  background:
    radial-gradient(circle at 20% 30%, rgba(110, 72, 170, .15) 0%, transparent 30%),
    radial-gradient(circle at 80% 70%, rgba(157, 80, 187, .15) 0%, transparent 30%);
}
/* Header band: left-to-right brand gradient; clips its own ::after strip. */
.header {
  position: relative;
  overflow: hidden;
  padding: 3rem 4rem 2rem;
  background: linear-gradient(90deg, var(--primary), var(--secondary));
}

/* Skewed dark strip hanging off the bottom edge, giving the header a slanted lower border. */
.header::after {
  content: "";
  position: absolute;
  left: 0;
  bottom: -50px;
  z-index: 1;
  width: 100%;
  height: 100px;
  background: var(--dark);
  transform: skewY(-3deg);
}
/* Header text layers: positioned at z-index 2 so they stack above the
   header's skewed ::after strip, which sits at z-index 1. */
.title,
.subtitle,
.authors,
.affiliations {
  position: relative;
  z-index: 2;
}

/* Main poster title. */
.title {
  margin-bottom: 1rem;
  font-size: 3.5rem;
  font-weight: 800;
  line-height: 1.1;
  text-shadow: 2px 2px 4px rgba(0, 0, 0, .3);
}

/* Tagline under the title. */
.subtitle {
  margin-bottom: 1.5rem;
  font-size: 1.5rem;
  font-weight: 300;
  opacity: .9;
}

/* Author and affiliation rows share the same wrapping flex layout. */
.authors,
.affiliations {
  display: flex;
  flex-wrap: wrap;
  gap: .5rem 1.5rem;
  margin-bottom: 1rem;
}

/* A single author name. */
.author {
  font-size: 1rem;
  font-weight: 500;
}

/* Affiliations are rendered smaller and dimmer than the author names. */
.affiliations {
  font-size: .9rem;
  opacity: .8;
}
/* Pill-shaped link to the project page; stacked above the header's ::after strip. */
.project-link {
  display: inline-flex;
  align-items: center;
  gap: 0.5rem;
  background: rgba(255, 255, 255, 0.1);
  padding: 0.5rem 1rem;
  border-radius: 50px;
  text-decoration: none;
  color: white;
  font-weight: 500;
  transition: all 0.3s ease;
  position: relative;
  z-index: 2;
}

/* Pointer feedback: brighten and lift slightly. */
.project-link:hover {
  background: rgba(255, 255, 255, 0.2);
  transform: translateY(-2px);
}

/* Keyboard feedback: same lift as hover plus an explicit high-contrast ring.
   Kept as a separate rule (not grouped with :hover) so that a browser which
   does not recognise :focus-visible drops only this rule, not the hover one. */
.project-link:focus-visible {
  background: rgba(255, 255, 255, 0.2);
  transform: translateY(-2px);
  outline: 2px solid white;
  outline-offset: 2px;
}
/* Main body: two equal columns, layered above the poster's glow overlay. */
.content {
  position: relative;
  z-index: 2;
  display: grid;
  grid-template-columns: repeat(2, 1fr);
  gap: 2rem;
  padding: 3rem 4rem;
}

/* Abstract card: spans every column and carries an accent stripe on its left edge. */
.abstract {
  grid-column: 1 / -1;
  padding: 2rem;
  border-left: 4px solid var(--accent);
  border-radius: 10px;
  background: rgba(255, 255, 255, .05);
}

/* Abstract heading. */
.abstract-title {
  margin-bottom: 1rem;
  font-size: 1.5rem;
  color: var(--accent);
}

/* Abstract body copy. */
.abstract-text {
  font-size: 1.1rem;
  line-height: 1.7;
}

/* Inline emphasis for key phrases. */
.highlight {
  font-weight: 600;
  color: var(--accent);
}
/* Feature list: a single-column stack of cards. */
.features {
  display: grid;
  grid-template-columns: 1fr;
  gap: 1.5rem;
}

/* One feature card. */
.feature {
  padding: 1.5rem;
  border-radius: 10px;
  background: rgba(255, 255, 255, .05);
  transition: all .3s ease;
}

/* Hover feedback: the card lifts and gains a drop shadow. */
.feature:hover {
  box-shadow: 0 10px 20px rgba(0, 0, 0, .2);
  transform: translateY(-5px);
}

/* Card heading: icon and label laid out on one line. */
.feature-title {
  display: flex;
  align-items: center;
  gap: .5rem;
  margin-bottom: .5rem;
  font-size: 1.2rem;
  color: var(--accent);
}

/* Icon glyph inside the card heading. */
.feature-icon {
  font-size: 1.5rem;
}

/* Card description text. */
.feature-text {
  font-size: 1rem;
  opacity: .9;
}
/* Figure frame: fills its grid cell, centres the image and clips the hover zoom. */
.image-container {
  position: relative; /* containing block for the absolutely positioned caption */
  display: flex;
  justify-content: center;
  align-items: center;
  height: 100%;
  overflow: hidden;
  border-radius: 10px;
  box-shadow: 0 10px 20px rgba(0, 0, 0, .3);
}

/* The image scales to the frame width and animates its transform. */
.image-container img {
  width: 100%;
  height: auto;
  object-fit: cover;
  transition: transform .5s ease;
}

/* Slight zoom while the pointer is over the frame. */
.image-container:hover img {
  transform: scale(1.03);
}

/* Caption bar pinned to the bottom edge of the frame, overlaying the image. */
.image-caption {
  position: absolute;
  right: 0;
  bottom: 0;
  left: 0;
  padding: 1rem;
  font-size: .9rem;
  text-align: center;
  background: rgba(0, 0, 0, .7);
}
/* Key-figure grid: two equal columns of stat cards. */
.stats {
  display: grid;
  grid-template-columns: 1fr 1fr;
  gap: 1.5rem;
  margin-top: 1.5rem;
}

/* One stat card. */
.stat {
  padding: 1.5rem;
  border-radius: 10px;
  text-align: center;
  background: rgba(255, 255, 255, .05);
}

/* The large headline number. */
.stat-value {
  margin-bottom: .5rem;
  font-size: 2.5rem;
  font-weight: bold;
  color: var(--accent);
}

/* The small description under the number. */
.stat-label {
  font-size: .9rem;
  opacity: .8;
}
/* Footer strip: dimmed, centred text on a darker band, layered above the glow overlay. */
.footer {
  position: relative;
  z-index: 2;
  padding: 2rem 4rem;
  font-size: .9rem;
  text-align: center;
  opacity: .7;
  background: rgba(0, 0, 0, .3);
}
/* Up to 992px wide: collapse the content grid to one column and tighten the header. */
@media (max-width: 992px) {
  .header {
    padding: 2rem;
  }

  .title {
    font-size: 2.5rem;
  }

  .subtitle {
    font-size: 1.2rem;
  }

  .content {
    grid-template-columns: 1fr;
    padding: 2rem;
  }
}

/* Up to 576px wide: shrink type and padding further and stack the stat cards. */
@media (max-width: 576px) {
  .header {
    padding: 1.5rem;
  }

  .title {
    font-size: 2rem;
  }

  .subtitle {
    font-size: 1rem;
  }

  .content {
    padding: 1.5rem;
  }

  .abstract {
    padding: 1.5rem;
  }

  .stats {
    grid-template-columns: 1fr;
  }
}
</style>
</head>
<body>
<div class="poster">
<!-- Poster header: title, tagline, author list, affiliations and the project link.
     Uses <header> so the block is exposed as introductory content; the
     .header class is kept, so the existing styling still applies. -->
<header class="header">
  <h1 class="title">JarvisArt</h1>
  <p class="subtitle">Liberating Human Artistic Creativity via an Intelligent Photo Retouching Agent</p>
  <div class="authors">
    <span class="author">Yunlong Lin*</span>
    <span class="author">Zixu Lin*</span>
    <span class="author">Kunjie Lin*</span>
    <span class="author">Jinbin Bai</span>
    <span class="author">Panwang Pan</span>
    <span class="author">Chenxin Li</span>
    <span class="author">Haoyu Chen</span>
    <span class="author">Zhongdao Wang</span>
    <span class="author">Xinghao Ding†</span>
    <span class="author">Wenbo Li♣</span>
    <span class="author">Shuicheng Yan†</span>
  </div>
  <div class="affiliations">
    <span>Xiamen University</span>
    <span>HKUST(GZ)</span>
    <span>CUHK</span>
    <span>Bytedance</span>
    <span>NUS</span>
    <span>Tsinghua University</span>
  </div>
  <!-- Opens in a new tab; rel="noopener noreferrer" stops the opened page from
       reaching back through window.opener and withholds the referrer. -->
  <a class="project-link" href="https://jarvisart.vercel.app/" target="_blank" rel="noopener noreferrer">
    <!-- Decorative icon: hidden from assistive technology, the link text carries the name. -->
    <i class="fas fa-external-link-alt" aria-hidden="true"></i>
    Project Page
  </a>
</header>
<div class="content">
<!-- Abstract card: a headed thematic group, so it is a <section> named by its own heading. -->
<section class="abstract" aria-labelledby="abstract-heading">
  <h2 class="abstract-title" id="abstract-heading">Abstract</h2>
  <p class="abstract-text">
    We introduce <span class="highlight">JarvisArt</span>, a multi-modal large language model (MLLM)-driven agent that understands user intent, mimics professional artists' reasoning, and intelligently coordinates over <span class="highlight">200 retouching tools</span> within Lightroom. JarvisArt undergoes a two-stage training process and demonstrates <span class="highlight">user-friendly interaction</span>, superior generalization, and fine-grained control over both global and local adjustments. Notably, it outperforms GPT-4o with a <span class="highlight">60% improvement</span> in average pixel-level metrics on our MMArt-Bench benchmark while maintaining comparable instruction-following capabilities.
  </p>
</section>
<!-- Feature cards. Each heading icon is purely decorative, so it carries
     aria-hidden="true" and screen readers announce only the heading text. -->
<div class="features">
  <div class="feature">
    <h3 class="feature-title">
      <i class="fas fa-brain feature-icon" aria-hidden="true"></i>
      Professional Reasoning
    </h3>
    <p class="feature-text">
      Mimics the reasoning process of professional artists through Chain-of-Thought supervised fine-tuning and GRPO-R optimization.
    </p>
  </div>
  <div class="feature">
    <h3 class="feature-title">
      <i class="fas fa-tools feature-icon" aria-hidden="true"></i>
      Comprehensive Toolset
    </h3>
    <p class="feature-text">
      Intelligently coordinates over 200 retouching tools within Lightroom for both global and local adjustments.
    </p>
  </div>
  <div class="feature">
    <h3 class="feature-title">
      <i class="fas fa-user-astronaut feature-icon" aria-hidden="true"></i>
      User-Friendly Interaction
    </h3>
    <p class="feature-text">
      Supports intuitive, free-form edits through natural inputs like text prompts, bounding boxes, or brushstrokes.
    </p>
  </div>
</div>
<!-- Figure 1: image and caption are tied together with <figure>/<figcaption>.
     The existing classes are kept, so the .image-container and .image-caption
     rules still apply; the stylesheet's universal margin reset removes the
     default <figure> margins. -->
<figure class="image-container">
  <img src="https://cdn.vansin.top/papers/2506.17612/images/b1b85618f6f156005dab98b71efac19eb8379eb249721ebe9c59ebcd55ca3412.jpg" alt="JarvisArt Interface" decoding="async">
  <figcaption class="image-caption">
    Figure 1: JarvisArt supports multi-granularity retouching through natural inputs and edits any-resolution images.
  </figcaption>
</figure>
<!-- Key figures: each card pairs a headline value with a short label. -->
<div class="stats">
  <div class="stat">
    <div class="stat-value">200+</div>
    <div class="stat-label">Retouching Tools</div>
  </div>
  <div class="stat">
    <div class="stat-value">60%</div>
    <div class="stat-label">Improvement over GPT-4o</div>
  </div>
  <div class="stat">
    <div class="stat-value">55K</div>
    <div class="stat-label">Training Samples</div>
  </div>
  <div class="stat">
    <!-- This value was empty, leaving a label with nothing above it. "Any"
         follows the Figure 1 caption ("edits any-resolution images"). -->
    <div class="stat-value">Any</div>
    <div class="stat-label">Image Resolution Support</div>
  </div>
</div>
</div>
<!-- Poster footer: a <footer> element so it is exposed as the page footer;
     the .footer class is kept, so the existing styling still applies. -->
<footer class="footer">
  JarvisArt: A new paradigm for intelligent photo retouching | https://jarvisart.vercel.app/
</footer>
</div>
</body>
</html>