|
|
|
�+root"_tf_keras_network*�+{"name": "text_encoder_1", "trainable": true, "expects_training_arg": true, "dtype": "float32", "batch_input_shape": null, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": false, "class_name": "TextEncoder", "config": {"name": "text_encoder_1", "layers": [{"class_name": "InputLayer", "config": {"batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "dtype": "int32", "sparse": false, "ragged": false, "name": "tokens"}, "name": "tokens", "inbound_nodes": []}, {"class_name": "InputLayer", "config": {"batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "dtype": "int32", "sparse": false, "ragged": false, "name": "positions"}, "name": "positions", "inbound_nodes": []}, {"class_name": "CLIPEmbedding", "config": {"name": "clip_embedding_1", "trainable": true, "dtype": "float32", "input_dim": 49409, "output_dim": 768, "max_length": 77}, "name": "clip_embedding_1", "inbound_nodes": [[["tokens", 0, 0, {}], ["positions", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_12", "inbound_nodes": [[["clip_embedding_1", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_13", "inbound_nodes": [[["clip_encoder_layer_12", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_14", "inbound_nodes": [[["clip_encoder_layer_13", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_15", "inbound_nodes": [[["clip_encoder_layer_14", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_16", "inbound_nodes": [[["clip_encoder_layer_15", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_17", "inbound_nodes": [[["clip_encoder_layer_16", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_18", "inbound_nodes": [[["clip_encoder_layer_17", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_19", "inbound_nodes": [[["clip_encoder_layer_18", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_20", "inbound_nodes": [[["clip_encoder_layer_19", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_21", "inbound_nodes": [[["clip_encoder_layer_20", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_22", "inbound_nodes": [[["clip_encoder_layer_21", 0, 0, {}]]]}, {"class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "name": "clip_encoder_layer_23", "inbound_nodes": [[["clip_encoder_layer_22", 0, 0, {}]]]}, {"class_name": "LayerNormalization", "config": {"name": "layer_normalization_49", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}}, "gamma_initializer": {"class_name": "Ones", "config": {}}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "name": "layer_normalization_49", "inbound_nodes": [[["clip_encoder_layer_23", 0, 0, {}]]]}], "input_layers": [["tokens", 0, 0], ["positions", 0, 0]], "output_layers": [["layer_normalization_49", 0, 0]]}, "shared_object_id": 6, "input_spec": [{"class_name": "InputSpec", "config": {"dtype": null, "shape": {"class_name": "__tuple__", "items": [null, 77]}, "ndim": 2, "max_ndim": null, "min_ndim": null, "axes": {}}}, {"class_name": "InputSpec", "config": {"dtype": null, "shape": {"class_name": "__tuple__", "items": [null, 77]}, "ndim": 2, "max_ndim": null, "min_ndim": null, "axes": {}}}], "build_input_shape": [{"class_name": "TensorShape", "items": [null, 77]}, {"class_name": "TensorShape", "items": [null, 77]}], "is_graph_network": true, "full_save_spec": {"class_name": "__tuple__", "items": [[[{"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [null, 77]}, "int32", "tokens"]}, {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [null, 77]}, "int32", "positions"]}]], {}]}, "save_spec": [{"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [null, 77]}, "int32", "tokens"]}, {"class_name": "TypeSpec", "type_spec": "tf.TensorSpec", "serialized": [{"class_name": "TensorShape", "items": [null, 77]}, "int32", "positions"]}], "keras_version": "2.11.0", "backend": "tensorflow", "model_config": {"class_name": "TextEncoder"}, "training_config": {"loss": null, "metrics": null, "weighted_metrics": null, "loss_weights": null, "optimizer_config": {"class_name": "Custom>RMSprop", "config": {"name": "RMSprop", "weight_decay": null, "clipnorm": null, "global_clipnorm": null, "clipvalue": null, "use_ema": false, "ema_momentum": 0.99, "ema_overwrite_frequency": 100, "jit_compile": true, "is_legacy_optimizer": false, "learning_rate": 0.0010000000474974513, "rho": 0.9, "momentum": 0.0, "epsilon": 1e-07, "centered": false}}}}2 |
|
�root.layer-0"_tf_keras_input_layer*�{"class_name": "InputLayer", "name": "tokens", "dtype": "int32", "sparse": false, "ragged": false, "batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "config": {"batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "dtype": "int32", "sparse": false, "ragged": false, "name": "tokens"}}2 |
|
�root.layer-1"_tf_keras_input_layer*�{"class_name": "InputLayer", "name": "positions", "dtype": "int32", "sparse": false, "ragged": false, "batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "config": {"batch_input_shape": {"class_name": "__tuple__", "items": [null, 77]}, "dtype": "int32", "sparse": false, "ragged": false, "name": "positions"}}2 |
|
�root.layer_with_weights-0"_tf_keras_layer*�{"name": "clip_embedding_1", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEmbedding", "config": {"name": "clip_embedding_1", "trainable": true, "dtype": "float32", "input_dim": 49409, "output_dim": 768, "max_length": 77}, "inbound_nodes": [[["tokens", 0, 0, {}], ["positions", 0, 0, {}]]], "shared_object_id": 2, "build_input_shape": [{"class_name": "TensorShape", "items": [null, 77]}, {"class_name": "TensorShape", "items": [null, 77]}]}2 |
|
�root.layer_with_weights-1"_tf_keras_layer*�{"name": "clip_encoder_layer_12", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-2"_tf_keras_layer*�{"name": "clip_encoder_layer_13", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-3"_tf_keras_layer*�{"name": "clip_encoder_layer_14", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-4"_tf_keras_layer*�{"name": "clip_encoder_layer_15", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-5"_tf_keras_layer*�{"name": "clip_encoder_layer_16", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
� root.layer_with_weights-6"_tf_keras_layer*�{"name": "clip_encoder_layer_17", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
� |
|
root.layer_with_weights-7"_tf_keras_layer*�{"name": "clip_encoder_layer_18", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-8"_tf_keras_layer*�{"name": "clip_encoder_layer_19", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-9"_tf_keras_layer*�{"name": "clip_encoder_layer_20", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�
root.layer_with_weights-10"_tf_keras_layer*�{"name": "clip_encoder_layer_21", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-11"_tf_keras_layer*�{"name": "clip_encoder_layer_22", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-12"_tf_keras_layer*�{"name": "clip_encoder_layer_23", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPEncoderLayer", "config": {"layer was saved without config": true}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�root.layer_with_weights-13"_tf_keras_layer*�{"name": "layer_normalization_49", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_49", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 3}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 4}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "inbound_nodes": [[["clip_encoder_layer_23", 0, 0, {}]]], "shared_object_id": 5, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�!)root.layer_with_weights-0.token_embedding"_tf_keras_layer*�{"name": "embedding_2", "trainable": true, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": {"class_name": "__tuple__", "items": [null, null]}, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": false, "class_name": "Embedding", "config": {"name": "embedding_2", "trainable": true, "dtype": "float32", "batch_input_shape": {"class_name": "__tuple__", "items": [null, null]}, "input_dim": 49409, "output_dim": 768, "embeddings_initializer": {"class_name": "RandomUniform", "config": {"minval": -0.05, "maxval": 0.05, "seed": null}, "shared_object_id": 9}, "embeddings_regularizer": null, "activity_regularizer": null, "embeddings_constraint": null, "mask_zero": false, "input_length": null}, "shared_object_id": 10, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77]}}2 |
|
�",root.layer_with_weights-0.position_embedding"_tf_keras_layer*�{"name": "embedding_3", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": {"class_name": "__tuple__", "items": [null, null]}, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": false, "class_name": "Embedding", "config": {"name": "embedding_3", "trainable": false, "dtype": "float32", "batch_input_shape": {"class_name": "__tuple__", "items": [null, null]}, "input_dim": 77, "output_dim": 768, "embeddings_initializer": {"class_name": "RandomUniform", "config": {"minval": -0.05, "maxval": 0.05, "seed": null}, "shared_object_id": 11}, "embeddings_regularizer": null, "activity_regularizer": null, "embeddings_constraint": null, "mask_zero": false, "input_length": null}, "shared_object_id": 12, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77]}}2 |
|
�)%root.layer_with_weights-1.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_25", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_25", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 13}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 14}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 15, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�*#root.layer_with_weights-1.clip_attn"_tf_keras_layer*�{"name": "clip_attention_12", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_12", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 16, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�+%root.layer_with_weights-1.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_26", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_26", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 17}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 18}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 19, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�,root.layer_with_weights-1.fc1"_tf_keras_layer*�{"name": "dense_76", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_76", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 20}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 21}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 22, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 23}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�-root.layer_with_weights-1.fc2"_tf_keras_layer*�{"name": "dense_77", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_77", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 24}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 25}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 26, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 27}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�4%root.layer_with_weights-2.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_27", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_27", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 28}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 29}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 30, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�5#root.layer_with_weights-2.clip_attn"_tf_keras_layer*�{"name": "clip_attention_13", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_13", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 31, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�6%root.layer_with_weights-2.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_28", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_28", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 32}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 33}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 34, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�7root.layer_with_weights-2.fc1"_tf_keras_layer*�{"name": "dense_82", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_82", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 35}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 36}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 37, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 38}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�8root.layer_with_weights-2.fc2"_tf_keras_layer*�{"name": "dense_83", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_83", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 39}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 40}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 41, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 42}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�?%root.layer_with_weights-3.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_29", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_29", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 43}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 44}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 45, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�@#root.layer_with_weights-3.clip_attn"_tf_keras_layer*�{"name": "clip_attention_14", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_14", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 46, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�A%root.layer_with_weights-3.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_30", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_30", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 47}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 48}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 49, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Broot.layer_with_weights-3.fc1"_tf_keras_layer*�{"name": "dense_88", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_88", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 50}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 51}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 52, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 53}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Croot.layer_with_weights-3.fc2"_tf_keras_layer*�{"name": "dense_89", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_89", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 54}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 55}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 56, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 57}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�J%root.layer_with_weights-4.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_31", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_31", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 58}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 59}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 60, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�K#root.layer_with_weights-4.clip_attn"_tf_keras_layer*�{"name": "clip_attention_15", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_15", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 61, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�L%root.layer_with_weights-4.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_32", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_32", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 62}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 63}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 64, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Mroot.layer_with_weights-4.fc1"_tf_keras_layer*�{"name": "dense_94", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_94", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 65}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 66}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 67, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 68}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Nroot.layer_with_weights-4.fc2"_tf_keras_layer*�{"name": "dense_95", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_95", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 69}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 70}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 71, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 72}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�U%root.layer_with_weights-5.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_33", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_33", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 73}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 74}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 75, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�V#root.layer_with_weights-5.clip_attn"_tf_keras_layer*�{"name": "clip_attention_16", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_16", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 76, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�W%root.layer_with_weights-5.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_34", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_34", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 77}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 78}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 79, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Xroot.layer_with_weights-5.fc1"_tf_keras_layer*�{"name": "dense_100", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_100", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 80}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 81}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 82, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 83}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�Yroot.layer_with_weights-5.fc2"_tf_keras_layer*�{"name": "dense_101", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_101", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 84}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 85}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 86, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 87}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�`%root.layer_with_weights-6.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_35", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_35", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 88}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 89}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 90, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�a#root.layer_with_weights-6.clip_attn"_tf_keras_layer*�{"name": "clip_attention_17", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_17", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 91, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�b%root.layer_with_weights-6.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_36", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_36", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 92}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 93}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 94, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�croot.layer_with_weights-6.fc1"_tf_keras_layer*�{"name": "dense_106", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_106", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 95}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 96}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 97, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 98}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�droot.layer_with_weights-6.fc2"_tf_keras_layer*�{"name": "dense_107", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_107", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 99}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 100}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 101, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 102}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�k%root.layer_with_weights-7.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_37", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_37", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 103}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 104}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 105, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�l#root.layer_with_weights-7.clip_attn"_tf_keras_layer*�{"name": "clip_attention_18", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_18", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 106, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�m%root.layer_with_weights-7.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_38", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_38", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 107}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 108}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 109, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�nroot.layer_with_weights-7.fc1"_tf_keras_layer*�{"name": "dense_112", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_112", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 110}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 111}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 112, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 113}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�oroot.layer_with_weights-7.fc2"_tf_keras_layer*�{"name": "dense_113", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_113", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 114}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 115}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 116, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 117}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
�v%root.layer_with_weights-8.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_39", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_39", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 118}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 119}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 120, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�w#root.layer_with_weights-8.clip_attn"_tf_keras_layer*�{"name": "clip_attention_19", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_19", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 121, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�x%root.layer_with_weights-8.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_40", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_40", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 122}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 123}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 124, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�yroot.layer_with_weights-8.fc1"_tf_keras_layer*�{"name": "dense_118", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_118", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 125}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 126}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 127, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 128}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
�zroot.layer_with_weights-8.fc2"_tf_keras_layer*�{"name": "dense_119", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_119", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 129}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 130}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 131, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 132}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
��%root.layer_with_weights-9.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_41", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_41", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 133}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 134}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 135, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��#root.layer_with_weights-9.clip_attn"_tf_keras_layer*�{"name": "clip_attention_20", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_20", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 136, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��%root.layer_with_weights-9.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_42", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_42", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 137}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 138}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 139, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-9.fc1"_tf_keras_layer*�{"name": "dense_124", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_124", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 140}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 141}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 142, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 143}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-9.fc2"_tf_keras_layer*�{"name": "dense_125", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_125", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 144}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 145}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 146, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 147}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
��&root.layer_with_weights-10.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_43", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_43", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 148}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 149}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 150, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��$root.layer_with_weights-10.clip_attn"_tf_keras_layer*�{"name": "clip_attention_21", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_21", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 151, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��&root.layer_with_weights-10.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_44", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_44", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 152}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 153}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 154, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-10.fc1"_tf_keras_layer*�{"name": "dense_130", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_130", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 155}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 156}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 157, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 158}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-10.fc2"_tf_keras_layer*�{"name": "dense_131", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_131", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 159}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 160}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 161, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 162}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
��&root.layer_with_weights-11.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_45", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_45", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 163}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 164}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 165, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��$root.layer_with_weights-11.clip_attn"_tf_keras_layer*�{"name": "clip_attention_22", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_22", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 166, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��&root.layer_with_weights-11.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_46", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_46", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 167}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 168}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 169, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-11.fc1"_tf_keras_layer*�{"name": "dense_136", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_136", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 170}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 171}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 172, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 173}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-11.fc2"_tf_keras_layer*�{"name": "dense_137", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_137", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 174}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 175}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 176, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 177}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
��&root.layer_with_weights-12.layer_norm1"_tf_keras_layer*�{"name": "layer_normalization_47", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_47", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 178}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 179}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 180, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��$root.layer_with_weights-12.clip_attn"_tf_keras_layer*�{"name": "clip_attention_23", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "CLIPAttention", "config": {"name": "clip_attention_23", "trainable": false, "dtype": "float32", "causal": true, "embed_dim": 768, "num_heads": 12}, "shared_object_id": 181, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��&root.layer_with_weights-12.layer_norm2"_tf_keras_layer*�{"name": "layer_normalization_48", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "LayerNormalization", "config": {"name": "layer_normalization_48", "trainable": false, "dtype": "float32", "axis": [2], "epsilon": 1e-05, "center": true, "scale": true, "beta_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 182}, "gamma_initializer": {"class_name": "Ones", "config": {}, "shared_object_id": 183}, "beta_regularizer": null, "gamma_regularizer": null, "beta_constraint": null, "gamma_constraint": null}, "shared_object_id": 184, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-12.fc1"_tf_keras_layer*�{"name": "dense_142", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_142", "trainable": false, "dtype": "float32", "units": 3072, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 185}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 186}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 187, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 188}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.layer_with_weights-12.fc2"_tf_keras_layer*�{"name": "dense_143", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_143", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 189}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 190}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 191, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 3072}}, "shared_object_id": 192}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 3072]}}2 |
|
��*root.layer_with_weights-1.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_72", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_72", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 193}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 194}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 195, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 196}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-1.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_73", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_73", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 197}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 198}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 199, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 200}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-1.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_74", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_74", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 201}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 202}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 203, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 204}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-1.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_75", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_75", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 205}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 206}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 207, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 208}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-2.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_78", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_78", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 209}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 210}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 211, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 212}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-2.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_79", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_79", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 213}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 214}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 215, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 216}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-2.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_80", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_80", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 217}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 218}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 219, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 220}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-2.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_81", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_81", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 221}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 222}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 223, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 224}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-3.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_84", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_84", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 225}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 226}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 227, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 228}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-3.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_85", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_85", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 229}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 230}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 231, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 232}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-3.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_86", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_86", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 233}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 234}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 235, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 236}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-3.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_87", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_87", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 237}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 238}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 239, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 240}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-4.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_90", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_90", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 241}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 242}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 243, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 244}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-4.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_91", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_91", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 245}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 246}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 247, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 248}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-4.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_92", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_92", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 249}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 250}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 251, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 252}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-4.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_93", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_93", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 253}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 254}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 255, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 256}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-5.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_96", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_96", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 257}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 258}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 259, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 260}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-5.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_97", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_97", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 261}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 262}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 263, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 264}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-5.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_98", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_98", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 265}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 266}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 267, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 268}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-5.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_99", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_99", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 269}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 270}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 271, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 272}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-6.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_102", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_102", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 273}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 274}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 275, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 276}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-6.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_103", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_103", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 277}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 278}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 279, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 280}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-6.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_104", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_104", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 281}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 282}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 283, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 284}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-6.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_105", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_105", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 285}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 286}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 287, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 288}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-7.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_108", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_108", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 289}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 290}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 291, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 292}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-7.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_109", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_109", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 293}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 294}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 295, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 296}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-7.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_110", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_110", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 297}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 298}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 299, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 300}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-7.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_111", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_111", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 301}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 302}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 303, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 304}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-8.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_114", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_114", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 305}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 306}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 307, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 308}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-8.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_115", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_115", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 309}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 310}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 311, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 312}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-8.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_116", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_116", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 313}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 314}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 315, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 316}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-8.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_117", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_117", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 317}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 318}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 319, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 320}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-9.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_120", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_120", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 321}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 322}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 323, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 324}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-9.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_121", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_121", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 325}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 326}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 327, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 328}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��*root.layer_with_weights-9.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_122", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_122", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 329}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 330}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 331, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 332}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��,root.layer_with_weights-9.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_123", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_123", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 333}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 334}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 335, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 336}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-10.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_126", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_126", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 337}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 338}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 339, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 340}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-10.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_127", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_127", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 341}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 342}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 343, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 344}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-10.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_128", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_128", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 345}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 346}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 347, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 348}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��-root.layer_with_weights-10.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_129", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_129", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 349}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 350}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 351, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 352}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-11.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_132", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_132", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 353}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 354}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 355, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 356}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-11.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_133", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_133", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 357}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 358}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 359, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 360}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-11.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_134", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_134", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 361}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 362}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 363, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 364}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��-root.layer_with_weights-11.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_135", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_135", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 365}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 366}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 367, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 368}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-12.clip_attn.q_proj"_tf_keras_layer*�{"name": "dense_138", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_138", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 369}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 370}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 371, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 372}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-12.clip_attn.k_proj"_tf_keras_layer*�{"name": "dense_139", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_139", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 373}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 374}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 375, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 376}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��+root.layer_with_weights-12.clip_attn.v_proj"_tf_keras_layer*�{"name": "dense_140", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_140", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 377}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 378}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 379, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 380}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��-root.layer_with_weights-12.clip_attn.out_proj"_tf_keras_layer*�{"name": "dense_141", "trainable": false, "expects_training_arg": false, "dtype": "float32", "batch_input_shape": null, "stateful": false, "must_restore_from_config": false, "preserve_input_structure_in_config": false, "autocast": true, "class_name": "Dense", "config": {"name": "dense_141", "trainable": false, "dtype": "float32", "units": 768, "activation": "linear", "use_bias": true, "kernel_initializer": {"class_name": "GlorotUniform", "config": {"seed": null}, "shared_object_id": 381}, "bias_initializer": {"class_name": "Zeros", "config": {}, "shared_object_id": 382}, "kernel_regularizer": null, "bias_regularizer": null, "activity_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "shared_object_id": 383, "input_spec": {"class_name": "InputSpec", "config": {"dtype": null, "shape": null, "ndim": null, "max_ndim": null, "min_ndim": 2, "axes": {"-1": 768}}, "shared_object_id": 384}, "build_input_shape": {"class_name": "TensorShape", "items": [null, 77, 768]}}2 |
|
��root.keras_api.metrics.0"_tf_keras_metric*�{"class_name": "Mean", "name": "loss", "dtype": "float32", "config": {"name": "loss", "dtype": "float32"}, "shared_object_id": 385}2 |