ProCreations
/

Pro-AI-TG

Model card | Files and versions | Community

ProCreations committed on Mar 17, 2024

Commit

686783c

·

verified ·

1 Parent(s): 524160c

Update tg.ggml

Files changed (1) hide show

tg.ggml +17 -5

tg.ggml CHANGED Viewed

@@ -11,7 +11,7 @@ model MyModel {
   // Embedding layer
   embeddings {
-    dim: 64;
   }
   // Encoder layers
@@ -19,13 +19,20 @@ model MyModel {
     type: lstm;
     units: 128;
     num_layers: 2;
   }
   // Decoder layers
   decoder {
     type: gru;
     units: 64;
-    num_layers: 1;
   }
   // Output layer
@@ -46,9 +53,14 @@ model MyModel {
   }
 }
-// Training parameters
-train {
-  // ... (Define training data and hyperparameters)
 }
 // Inference parameters

   // Embedding layer
   embeddings {
+    dim: 128;
   }
   // Encoder layers
     type: lstm;
     units: 128;
     num_layers: 2;
+    dropout: 0.2;  // Add dropout for regularization
   }
   // Decoder layers
   decoder {
     type: gru;
     units: 64;
+    num_layers: 2;
+    dropout: 0.1;  // Add dropout for regularization
+  }
+  // Attention mechanism
+  attention {
+    type: scaled_dot_product;
   }
   // Output layer
   }
 }
+// Training parameters (in train.json)
+{
+  "data_path": "path/to/your/training_data.txt",
+  "batch_size": 32,
+  "epochs": 10,
+  "use_scheduled_sampling": true,  // Enable scheduled sampling
+  "clip_gradients": 5.0,  // Add gradient clipping to prevent exploding gradients
+  "use_batch_norm": true  // Enable batch normalization
 }
 // Inference parameters