Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
@@ -1,3 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
# Aligned Diffusion Model via DPO
|
2 |
|
3 |
Diffusion Model Aligned with the following reward model and DPO algorithm
|
@@ -33,4 +41,14 @@ prompt = "a pink flower"
|
|
33 |
|
34 |
image = pipeline(prompt=prompt, generator=generator, guidance_scale=gs).images[0]
|
35 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
```
|
|
|
1 |
+
---
|
2 |
+
tags:
|
3 |
+
- stable-diffusion
|
4 |
+
- stable-diffusion-diffusers
|
5 |
+
- text-to-image
|
6 |
+
inference: true
|
7 |
+
---
|
8 |
+
|
9 |
# Aligned Diffusion Model via DPO
|
10 |
|
11 |
Diffusion Model Aligned with the following reward model and DPO algorithm
|
|
|
41 |
|
42 |
image = pipeline(prompt=prompt, generator=generator, guidance_scale=gs).images[0]
|
43 |
|
44 |
+
```
|
45 |
+
|
46 |
+
|
47 |
+
## Citation
|
48 |
+
```
|
49 |
+
@misc{mjbench2024mjbench,
|
50 |
+
title={MJ-BENCH: Is Your Multimodal Reward Model Really a Good Judge?},
|
51 |
+
author={Zhaorun Chen* and Yichao Du* and Zichen Wen and Yiyang Zhou and Chenhang Cui and Zhenzhen Weng and Haoqin Tu and Chaoqi Wang and Zhengwei Tong and Leria HUANG and Canyu Chen and Qinghao Ye and Zhihong Zhu and Yuqing Zhang and Jiawei Zhou and Zhuokai Zhao and Rafael Rafailov and Chelsea Finn and Huaxiu Yao},
|
52 |
+
year={2024}
|
53 |
+
}
|
54 |
```
|