autoencoder works

ariG23498 · ariG23498 · commit 58e7e932eeb2 · 2024-10-09T18:17:16.000Z
diff --git a/jflux/modules/autoencoder.py b/jflux/modules/autoencoder.py
@@ -85,7 +85,7 @@ def attention(self, h_: Array) -> Array:
         v = rearrange(v, "b h w c-> b (h w) 1 c")
 
         # Calculate Attention
-        h_ = nnx.dot_product_attention(q, k, v)
+        h_ = jax.nn.dot_product_attention(q, k, v)
 
         return rearrange(h_, "b (h w) 1 c -> b h w c", h=h, w=w, c=c, b=b)
 
diff --git a/jflux/util.py b/jflux/util.py
@@ -4,6 +4,7 @@
 import torch  # need for t5 and clip
 from flax import nnx
 from huggingface_hub import hf_hub_download
+import jax
 from jax import numpy as jnp
 from safetensors import safe_open
 
@@ -12,6 +13,11 @@
 from jflux.modules.conditioner import HFEmbedder
 from jflux.port import port_autoencoder, port_flux
 
+def torch2jax(torch_tensor):  # Convert a torch tensor into a jax.numpy array stored as bfloat16.
+    intermediate_tensor = torch_tensor.to(torch.float32)  # cast to float32 first; presumably needed because the source dtype cannot be handed to jnp.array directly -- TODO confirm
+    jax_tensor = jnp.array(intermediate_tensor, dtype=jnp.bfloat16)  # result dtype is always bfloat16, whatever the input dtype was
+    return jax_tensor
+
 
 @dataclass
 class ModelSpec:
@@ -127,9 +133,10 @@ def load_flow_model(name: str, hf_download: bool = True) -> Flux:
 
     if ckpt_path is not None:
         tensors = {}
-        with safe_open(ckpt_path, framework="flax") as f:
+        with safe_open(ckpt_path, framework="pt") as f:
             for k in f.keys():
-                tensors[k] = f.get_tensor(k)
+                with jax.default_device(jax.devices("cpu")[0]):
+                    tensors[k] = torch2jax(f.get_tensor(k))
 
         model = port_flux(flux=model, tensors=tensors)
         del tensors
@@ -166,9 +173,10 @@ def load_ae(name: str, hf_download: bool = True) -> AutoEncoder:
 
     if ckpt_path is not None:
         tensors = {}
-        with safe_open(ckpt_path, framework="flax") as f:
+        with safe_open(ckpt_path, framework="pt") as f:
             for k in f.keys():
-                tensors[k] = f.get_tensor(k)
+                with jax.default_device(jax.devices("cpu")[0]):
+                    tensors[k] = torch2jax(f.get_tensor(k))
 
         ae = port_autoencoder(autoencoder=ae, tensors=tensors)
         del tensors