Spaces:

flax-community
/

dalle-mini

Running

valhalla committed on Oct 19, 2021

Commit

e5a52b9

1 Parent(s): a265819

add property to get num params

Files changed (1) hide show

dalle_mini/modeling_bart_flax.py CHANGED Viewed

@@ -24,6 +24,7 @@ import flax.linen as nn
 import jax
 import jax.numpy as jnp
 from flax.core.frozen_dict import FrozenDict, unfreeze
 from flax.linen import combine_masks, make_causal_mask
 from flax.linen.attention import dot_product_attention_weights
 from jax import lax
@@ -622,6 +623,11 @@ class FlaxBartPreTrainedModel(FlaxPreTrainedModel):
         module = self.module_class(config=config, dtype=dtype)
         super().__init__(config, module, input_shape=input_shape, seed=seed, dtype=dtype, **kwargs)
     def init_weights(self, rng: jax.random.PRNGKey, input_shape: Tuple) -> FrozenDict:
         # init input tensors
         input_ids = jnp.zeros(input_shape, dtype="i4")

 import jax
 import jax.numpy as jnp
 from flax.core.frozen_dict import FrozenDict, unfreeze
+from flax.traverse_util import flatten_dict
 from flax.linen import combine_masks, make_causal_mask
 from flax.linen.attention import dot_product_attention_weights
 from jax import lax
         module = self.module_class(config=config, dtype=dtype)
         super().__init__(config, module, input_shape=input_shape, seed=seed, dtype=dtype, **kwargs)
+    @property
+    def num_params(self):
+        num_params = jax.tree_map(lambda param: param.size, flatten_dict(unfreeze(self.params))).values()
+        return sum(list(num_params))
     def init_weights(self, rng: jax.random.PRNGKey, input_shape: Tuple) -> FrozenDict:
         # init input tensors
         input_ids = jnp.zeros(input_shape, dtype="i4")