Juna190825 committed on
Commit
303bada
·
verified ·
1 Parent(s): 4476e77

Save model using Keras.

Browse files
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. README.md +17 -0
  3. assets/summary_plot.png +3 -0
  4. config.json +1 -0
  5. metadata.json +1 -0
  6. model.weights.h5 +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ assets/summary_plot.png filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ ---
3
+ library_name: keras
4
+ ---
5
+
6
+ This model has been uploaded using the Keras library and can be used with JAX,
7
+ TensorFlow, and PyTorch backends.
8
+
9
+ This model card has been generated automatically and should be completed by the
10
+ model author.
11
+ See [Model Cards documentation](https://huggingface.co/docs/hub/model-cards) for
12
+ more information.
13
+
14
+ For more details about the model architecture, check out
15
+ [config.json](./config.json).
16
+
17
+ ![](./assets/summary_plot.png)
assets/summary_plot.png ADDED

Git LFS Details

  • SHA256: 28f9e9414b8b890760918b6f221caf25e81241341cd1333def8e5614e2d527fc
  • Pointer size: 131 Bytes
  • Size of remote file: 137 kB
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"module": "keras.src.models.functional", "class_name": "Functional", "config": {"name": "functional_1", "trainable": true, "layers": [{"module": "keras.layers", "class_name": "InputLayer", "config": {"batch_shape": [null, null], "dtype": "int64", "sparse": false, "ragged": false, "name": "encoder_input"}, "registered_name": null, "name": "encoder_input", "inbound_nodes": []}, {"module": "keras_hub.src.layers.modeling.token_and_position_embedding", "class_name": "TokenAndPositionEmbedding", "config": {"name": "token_and_position_embedding", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null}, "vocabulary_size": 34407, "sequence_length": 210, "embedding_dim": 256, "embeddings_initializer": {"module": "keras.initializers", "class_name": "RandomUniform", "config": {"seed": null, "minval": -0.05, "maxval": 0.05}, "registered_name": null}, "tie_weights": true, "mask_zero": false}, "registered_name": "keras_hub>TokenAndPositionEmbedding", "build_config": {"input_shape": [null, null]}, "name": "token_and_position_embedding", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": {"shape": [null, null], "dtype": "int64", "keras_history": ["encoder_input", 0, 0]}}], "kwargs": {}}]}, {"module": "keras.layers", "class_name": "InputLayer", "config": {"batch_shape": [null, null], "dtype": "int64", "sparse": false, "ragged": false, "name": "decoder_input"}, "registered_name": null, "name": "decoder_input", "inbound_nodes": [], "shared_object_id": 135257918797968}, {"module": "keras_hub.src.layers.modeling.transformer_encoder", "class_name": "TransformerEncoder", "config": {"name": "transformer_encoder", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null, "shared_object_id": 135258055796560}, "intermediate_dim": 256, "num_heads": 8, "dropout": 0, "activation": "relu", "layer_norm_epsilon": 1e-05, 
"kernel_initializer": {"module": "keras.initializers", "class_name": "GlorotUniform", "config": {"seed": null}, "registered_name": null}, "bias_initializer": {"module": "keras.initializers", "class_name": "Zeros", "config": {}, "registered_name": null}, "normalize_first": false}, "registered_name": "keras_hub>TransformerEncoder", "build_config": {"input_shape": [null, null, 256]}, "name": "transformer_encoder", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": {"shape": [null, null, 256], "dtype": "float32", "keras_history": ["token_and_position_embedding", 0, 0]}}], "kwargs": {}}]}, {"module": "keras.src.models.functional", "class_name": "Functional", "config": {"name": "functional", "trainable": true, "layers": [{"module": "keras.layers", "class_name": "InputLayer", "config": {"batch_shape": [null, null], "dtype": "int64", "sparse": false, "ragged": false, "name": "decoder_input"}, "registered_name": null, "shared_object_id": 135257918797968, "name": "decoder_input", "inbound_nodes": []}, {"module": "keras_hub.src.layers.modeling.token_and_position_embedding", "class_name": "TokenAndPositionEmbedding", "config": {"name": "token_and_position_embedding_1", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null, "shared_object_id": 135258055796560}, "vocabulary_size": 51212, "sequence_length": 210, "embedding_dim": 256, "embeddings_initializer": {"module": "keras.initializers", "class_name": "RandomUniform", "config": {"seed": null, "minval": -0.05, "maxval": 0.05}, "registered_name": null}, "tie_weights": true, "mask_zero": true}, "registered_name": "keras_hub>TokenAndPositionEmbedding", "build_config": {"input_shape": [null, null]}, "name": "token_and_position_embedding_1", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": {"shape": [null, null], "dtype": "int64", "keras_history": ["decoder_input", 0, 0]}}], "kwargs": {}}]}, {"module": 
"keras.layers", "class_name": "InputLayer", "config": {"batch_shape": [null, null, 256], "dtype": "float32", "sparse": false, "ragged": false, "name": "input_layer"}, "registered_name": null, "name": "input_layer", "inbound_nodes": []}, {"module": "keras_hub.src.layers.modeling.transformer_decoder", "class_name": "TransformerDecoder", "config": {"name": "transformer_decoder", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null, "shared_object_id": 135258055796560}, "intermediate_dim": 256, "num_heads": 8, "dropout": 0, "activation": "relu", "layer_norm_epsilon": 1e-05, "kernel_initializer": {"module": "keras.initializers", "class_name": "GlorotUniform", "config": {"seed": null}, "registered_name": null}, "bias_initializer": {"module": "keras.initializers", "class_name": "Zeros", "config": {}, "registered_name": null}, "normalize_first": false, "decoder_sequence_shape": [null, null, 256], "encoder_sequence_shape": [null, null, 256]}, "registered_name": "keras_hub>TransformerDecoder", "build_config": {"shapes_dict": {"decoder_sequence_shape": [null, null, 256], "encoder_sequence_shape": [null, null, 256]}}, "name": "transformer_decoder", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": {"shape": [null, null, 256], "dtype": "float32", "keras_history": ["token_and_position_embedding_1", 0, 0]}}, {"class_name": "__keras_tensor__", "config": {"shape": [null, null, 256], "dtype": "float32", "keras_history": ["input_layer", 0, 0]}}], "kwargs": {}}]}, {"module": "keras.layers", "class_name": "Dropout", "config": {"name": "dropout_3", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null, "shared_object_id": 135258055796560}, "rate": 0.4, "seed": null, "noise_shape": null}, "registered_name": null, "name": "dropout_3", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": 
{"shape": [null, null, 256], "dtype": "float32", "keras_history": ["transformer_decoder", 0, 0]}}], "kwargs": {"training": false}}]}, {"module": "keras.layers", "class_name": "Dense", "config": {"name": "dense", "trainable": true, "dtype": {"module": "keras", "class_name": "DTypePolicy", "config": {"name": "float32"}, "registered_name": null, "shared_object_id": 135258055796560}, "units": 51212, "activation": "softmax", "use_bias": true, "kernel_initializer": {"module": "keras.initializers", "class_name": "GlorotUniform", "config": {"seed": null}, "registered_name": null}, "bias_initializer": {"module": "keras.initializers", "class_name": "Zeros", "config": {}, "registered_name": null}, "kernel_regularizer": null, "bias_regularizer": null, "kernel_constraint": null, "bias_constraint": null}, "registered_name": null, "build_config": {"input_shape": [null, null, 256]}, "name": "dense", "inbound_nodes": [{"args": [{"class_name": "__keras_tensor__", "config": {"shape": [null, null, 256], "dtype": "float32", "keras_history": ["dropout_3", 0, 0]}}], "kwargs": {}}]}], "input_layers": [["decoder_input", 0, 0], ["input_layer", 0, 0]], "output_layers": [["dense", 0, 0]]}, "registered_name": "Functional", "build_config": {"input_shape": null}, "compile_config": {}, "name": "functional", "inbound_nodes": [{"args": [[{"class_name": "__keras_tensor__", "config": {"shape": [null, null], "dtype": "int64", "keras_history": ["decoder_input", 0, 0]}}, {"class_name": "__keras_tensor__", "config": {"shape": [null, null, 256], "dtype": "float32", "keras_history": ["transformer_encoder", 0, 0]}}]], "kwargs": {"mask": [null, null]}}]}], "input_layers": [["encoder_input", 0, 0], ["decoder_input", 0, 0]], "output_layers": [["functional", 1, 0]]}, "registered_name": "Functional", "build_config": {"input_shape": null}, "compile_config": {"optimizer": {"module": "keras.optimizers", "class_name": "Adam", "config": {"name": "adam", "learning_rate": 0.0010000000474974513, "weight_decay": null, 
"clipnorm": null, "global_clipnorm": null, "clipvalue": null, "use_ema": false, "ema_momentum": 0.99, "ema_overwrite_frequency": null, "loss_scale_factor": null, "gradient_accumulation_steps": null, "beta_1": 0.9, "beta_2": 0.999, "epsilon": 1e-07, "amsgrad": false}, "registered_name": null}, "loss": "sparse_categorical_crossentropy", "loss_weights": null, "metrics": ["accuracy"], "weighted_metrics": null, "run_eagerly": false, "steps_per_execution": 1, "jit_compile": true}}
metadata.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"keras_version": "3.10.0", "date_saved": "2025-06-22@05:29:42"}
model.weights.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:622015a1fb86a700b091c279aff771b7bdfb642b6922743d431aa5fa6378346c
3
+ size 435073716