Upload 8 files
Browse files- .gitattributes +3 -0
- README.md +59 -0
- config.yaml +60 -0
- flux_train_replicate.safetensors +3 -0
- optimizer.pt +3 -0
- samples/HDRI panoramic view of TOK, inside of a beautiful japanese onsen with sakura tree, hot baths.webp +3 -0
- samples/HDRI panoramic view of TOK, inside of a fighter jet cockpit, flying in the air, over an aircraft carrier, in San Francisco bay.webp +0 -0
- samples/HDRI panoramic view of TOK, inside of an art gallery, very modern, luxurious stylish, with expensive marble and copper-plated stuff.webp +3 -0
- samples/HDRI panoramic view of TOK, visiting an amusement park about harry potter.webp +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
samples/HDRI[[:space:]]panoramic[[:space:]]view[[:space:]]of[[:space:]]TOK,[[:space:]]inside[[:space:]]of[[:space:]]a[[:space:]]beautiful[[:space:]]japanese[[:space:]]onsen[[:space:]]with[[:space:]]sakura[[:space:]]tree,[[:space:]]hot[[:space:]]baths.webp filter=lfs diff=lfs merge=lfs -text
|
37 |
+
samples/HDRI[[:space:]]panoramic[[:space:]]view[[:space:]]of[[:space:]]TOK,[[:space:]]inside[[:space:]]of[[:space:]]an[[:space:]]art[[:space:]]gallery,[[:space:]]very[[:space:]]modern,[[:space:]]luxurious[[:space:]]stylish,[[:space:]]with[[:space:]]expensive[[:space:]]marble[[:space:]]and[[:space:]]copper-plated[[:space:]]stuff.webp filter=lfs diff=lfs merge=lfs -text
|
38 |
+
samples/HDRI[[:space:]]panoramic[[:space:]]view[[:space:]]of[[:space:]]TOK,[[:space:]]visiting[[:space:]]an[[:space:]]amusement[[:space:]]park[[:space:]]about[[:space:]]harry[[:space:]]potter.webp filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: other
|
3 |
+
license_name: flux-1-dev-non-commercial-license
|
4 |
+
license_link: https://huggingface.co/black-forest-labs/FLUX.1-dev/blob/main/LICENSE.md
|
5 |
+
language:
|
6 |
+
- en
|
7 |
+
library_name: diffusers
|
8 |
+
pipeline_tag: text-to-image
|
9 |
+
base_model: black-forest-labs/FLUX.1-dev
|
10 |
+
tags:
|
11 |
+
- diffusers
|
12 |
+
- lora
|
13 |
+
- flux
|
14 |
+
inference:
|
15 |
+
parameters:
|
16 |
+
width: 1536
|
17 |
+
height: 640
|
18 |
+
widget:
|
19 |
+
- text: "HDRI panoramic view of TOK, visiting an amusement park about harry potter."
|
20 |
+
output:
|
21 |
+
url: "samples/HDRI panoramic view of TOK, visiting an amusement park about harry potter.webp"
|
22 |
+
- text: "HDRI panoramic view of TOK, inside of a beautiful japanese onsen with sakura tree, hot baths"
|
23 |
+
output:
|
24 |
+
url: "samples/HDRI panoramic view of TOK, inside of a beautiful japanese onsen with sakura tree, hot baths.webp"
|
25 |
+
- text: "HDRI panoramic view of TOK, inside of an art gallery, very modern, luxurious stylish, with expensive marble and copper-plated stuff"
|
26 |
+
output:
|
27 |
+
url: "samples/HDRI panoramic view of TOK, inside of an art gallery, very modern, luxurious stylish, with expensive marble and copper-plated stuff.webp"
|
28 |
+
- text: "HDRI panoramic view of TOK, inside of a fighter jet cockpit, flying in the air, over an aircraft carrier, in San Francisco bay"
|
29 |
+
output:
|
30 |
+
url: "samples/HDRI panoramic view of TOK, inside of a fighter jet cockpit, flying in the air, over an aircraft carrier, in San Francisco bay.webp"
|
31 |
+
---
|
32 |
+
|
33 |
+
<Gallery />
|
34 |
+
|
35 |
+
# FLUX.1-[dev] Panorama LoRA (v2)
|
36 |
+
|
37 |
+
A LoRA model for generating panoramas with FLUX.1-[dev].
|
38 |
+
|
39 |
+
## Which image ratio to use?
|
40 |
+
|
41 |
+
This model has been trained on images with a 2:1 ratio (2048x1024).
|
42 |
+
|
43 |
+
So you might get good results if you use this resolution (2048x1024) for width and height.
|
44 |
+
|
45 |
+
However, panorama viewers are pretty flexible when it comes to resolution, and FLUX.1 seems to generalize well.
|
46 |
+
|
47 |
+
For instance, the gallery samples have been generated at 1536 × 640 (~21:9), since this is reasonably fast (16 sec on the HF Inference API).
|
48 |
+
|
49 |
+
## It doesn't work for case X or Y
|
50 |
+
|
51 |
+
It usually works fine for "normal" requests, but the model might have trouble creating the spherical distortion if you ask for uncommon content, locations or angles.
|
52 |
+
|
53 |
+
If you give me some examples, maybe I can try to find more data to better cover uncommon panoramas.
|
54 |
+
|
55 |
+
## Non-commercial use
|
56 |
+
|
57 |
+
As the base model is FLUX.1-[dev] and since the data comes from Google Street View, it should be used for [non-commercial, personal or demonstration purposes only](https://github.com/black-forest-labs/flux/blob/main/model_licenses/LICENSE-FLUX1-dev).
|
58 |
+
|
59 |
+
Please use it responsibly, thank you!
|
config.yaml
ADDED
@@ -0,0 +1,60 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
config:
|
2 |
+
name: flux_train_replicate
|
3 |
+
process:
|
4 |
+
- datasets:
|
5 |
+
- cache_latents_to_disk: true
|
6 |
+
caption_dropout_rate: 0.05
|
7 |
+
caption_ext: filename
|
8 |
+
folder_path: input_images
|
9 |
+
resolution:
|
10 |
+
- 512
|
11 |
+
- 768
|
12 |
+
- 1024
|
13 |
+
shuffle_tokens: false
|
14 |
+
device: cuda:0
|
15 |
+
model:
|
16 |
+
is_flux: true
|
17 |
+
name_or_path: black-forest-labs/FLUX.1-dev
|
18 |
+
quantize: true
|
19 |
+
network:
|
20 |
+
linear: 16
|
21 |
+
linear_alpha: 16
|
22 |
+
type: lora
|
23 |
+
sample:
|
24 |
+
guidance_scale: 4
|
25 |
+
height: 1024
|
26 |
+
neg: ''
|
27 |
+
prompts:
|
28 |
+
- a sign that says 'I LOVE PROMPTS!' in the style of [trigger]
|
29 |
+
sample_every: 250
|
30 |
+
sample_steps: 20
|
31 |
+
sampler: flowmatch
|
32 |
+
seed: 42
|
33 |
+
walk_seed: true
|
34 |
+
width: 1024
|
35 |
+
save:
|
36 |
+
dtype: float16
|
37 |
+
max_step_saves_to_keep: 1
|
38 |
+
save_every: 2001
|
39 |
+
train:
|
40 |
+
batch_size: 1
|
41 |
+
content_or_style: balanced
|
42 |
+
dtype: bf16
|
43 |
+
ema_config:
|
44 |
+
ema_decay: 0.99
|
45 |
+
use_ema: true
|
46 |
+
gradient_accumulation_steps: 1
|
47 |
+
gradient_checkpointing: true
|
48 |
+
lr: 0.0004
|
49 |
+
noise_scheduler: flowmatch
|
50 |
+
optimizer: adamw8bit
|
51 |
+
steps: 2000
|
52 |
+
train_text_encoder: false
|
53 |
+
train_unet: true
|
54 |
+
training_folder: output
|
55 |
+
trigger_word: TOK
|
56 |
+
type: sd_trainer
|
57 |
+
job: extension
|
58 |
+
meta:
|
59 |
+
name: flux_train_replicate
|
60 |
+
version: '1.0'
|
flux_train_replicate.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea506dc7b0923ee5e693449c122d8ecad700c54d78d7096a74d43c99d4a398e
|
3 |
+
size 171969416
|
optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09c98bb0b2280145810efaf224f4cce47d55b5fcfae123ebeac4276b0498c9d3
|
3 |
+
size 173272836
|
samples/HDRI panoramic view of TOK, inside of a beautiful japanese onsen with sakura tree, hot baths.webp
ADDED
![]() |
Git LFS Details
|
samples/HDRI panoramic view of TOK, inside of a fighter jet cockpit, flying in the air, over an aircraft carrier, in San Francisco bay.webp
ADDED
![]() |
samples/HDRI panoramic view of TOK, inside of an art gallery, very modern, luxurious stylish, with expensive marble and copper-plated stuff.webp
ADDED
![]() |
Git LFS Details
|
samples/HDRI panoramic view of TOK, visiting an amusement park about harry potter.webp
ADDED
![]() |
Git LFS Details
|