Bertug1911
/

Br-T-1.5

Text2Text Generation

Adapters

Turkish

code

Model card Files Files and versions Community

Bertug1911 commited on Jan 27

Commit

cdad224

verified ·

1 Parent(s): 8a18b4d

Upload Br-T-1.5.py

Browse files

Files changed (1) hide show

Br-T-1.5.py +135 -0

Br-T-1.5.py ADDED Viewed

	@@ -0,0 +1,135 @@

+import os
+import re
+import numpy as np
+from gensim.models import Word2Vec
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Dense, LSTM, Embedding, GRU, Dropout
+from tensorflow.keras.preprocessing.text import Tokenizer
+from tensorflow.keras.preprocessing.sequence import pad_sequences
+from tensorflow.keras.layers import Layer, MultiHeadAttention, LayerNormalization
+# === PARAMETRE AÇIKLAMALARI VE AYARLARI ===
+max_worker = os.cpu_count()                      # İşlemcideki toplam çekirdek sayısı
+vector_size = 1000                               # Word2Vec modelinin her kelime için vektör boyutu
+window_size = 50                                 # Word2Vec’te komşuluk penceresi boyutu
+min_count = 1                                    # Word2Vec’te dikkate alınacak minimum kelime frekansı
+context_length = 256                             # Modelin giriş dizilerinin maksimum uzunluğu
+sentence_length = 5                              # Üretilen cümlelerin maksimum uzunluğu
+# Transformer Encoder Parametreleri
+embed_dim = 128                                  # Girdilerin (kelimelerin) vektörel boyutu
+num_heads = 4                                    # Multi-Head Attention mekanizmasındaki başlık sayısı
+feed_forward_dim = 512                           # Feed-Forward Network içindeki ara katman boyutu
+dropout_rate_transformer = 0.1                   # Transformer Encoder için Dropout oranı
+epsilon = 1e-6                                   # LayerNormalization stabilitesi için kullanılan sabit
+# LSTM ve GRU Katman Parametreleri
+lstm_units = [16000, 16000, 16000, 8000, 4096]   # Her LSTM katmanındaki nöron sayısı
+gru_units = [2048, 2048, 1024, 1024, 512, 256, 128, 64, 32, 16, 8, 4, 2, 1]  # Her GRU katmanındaki nöron sayıları
+dropout_rate_rnn = 0.1                           # LSTM ve GRU için ortak Dropout oranı
+return_sequences = True                          # LSTM ve GRU'da tüm zaman adımlarını döndürme parametresi
+# Embedding Katman Parametreleri
+input_dim = 10000                                # Girişteki toplam kelime sayısı (vocab size)
+output_dim = 1000                                # Her kelimenin vektörel boyutu
+input_length = context_length                    # Girişteki maksimum dizi uzunluğu
+# Dense Katman Parametreleri
+dense_units = input_dim                          # Dense katmanındaki nöron sayısı (sınıf sayısı)
+activation = "softmax"                           # Dense katmanı aktivasyon fonksiyonu
+# Optimizasyon ve Eğitim Parametreleri
+loss = "sparse_categorical_crossentropy"         # Kayıp fonksiyonu
+optimizer = "adam"                               # Optimizasyon algoritması
+metrics = ["accuracy"]                           # Eğitim sırasında izlenecek başarı ölçütleri
+epochs = 20                                      # Eğitim döngüsü sayısı
+batch_size = 32                                  # Her eğitim adımında işlenecek örnek sayısı
+# === TransformerEncoder Sınıfı ===
+class TransformerEncoder(Layer):
+    def __init__(self, embed_dim, num_heads, feed_forward_dim, dropout_rate=0.1):
+        super(TransformerEncoder, self).__init__()
+        self.attention = MultiHeadAttention(num_heads=num_heads, key_dim=embed_dim)
+        self.dropout1 = Dropout(dropout_rate)
+        self.norm1 = LayerNormalization(epsilon=epsilon)
+        self.dense1 = Dense(feed_forward_dim, activation="relu")
+        self.dense2 = Dense(embed_dim)
+        self.dropout2 = Dropout(dropout_rate)
+        self.norm2 = LayerNormalization(epsilon=epsilon)
+    def call(self, inputs, training=None):
+        # Multi-Head Attention
+        attention_output = self.attention(inputs, inputs)
+        attention_output = self.dropout1(attention_output, training=training)
+        out1 = self.norm1(inputs + attention_output)  # Residual Connection
+        # Feed-Forward Network
+        dense_output = self.dense1(out1)
+        dense_output = self.dense2(dense_output)
+        dense_output = self.dropout2(dense_output, training=training)
+        return self.norm2(out1 + dense_output)  # Residual Connection
+# === Model Eğitimi ===
+def train_model(X, y, tokenizer):
+    nn_model = Sequential([
+        # Embedding katmanı
+        Embedding(input_dim=input_dim, output_dim=output_dim, input_length=input_length),
+        # LSTM Katmanları
+        *[LSTM(units, return_sequences=True, dropout=dropout_rate_rnn) for units in lstm_units[:-1]],
+        LSTM(lstm_units[-1], return_sequences=True, dropout=dropout_rate_rnn),
+        # GRU Katmanları
+        *[GRU(units, return_sequences=True, dropout=dropout_rate_rnn) for units in gru_units[:-1]],
+        GRU(gru_units[-1], return_sequences=False, dropout=dropout_rate_rnn),
+        # Dense Katmanı
+        Dense(dense_units, activation=activation)
+    ])
+    nn_model.compile(loss=loss, optimizer=optimizer, metrics=metrics)
+    print("Model eğitiliyor...")
+    nn_model.fit(X, y, epochs=epochs, batch_size=batch_size)
+    return nn_model
+# === Cümle Üretim Fonksiyonu ===
+def generate_sentence(model, tokenizer, start_word, sentence_length, temperature=1.0):
+    sentence = [start_word]
+    for _ in range(sentence_length - 1):
+        sequence = tokenizer.texts_to_sequences([' '.join(sentence)])
+        sequence = pad_sequences(sequence, maxlen=context_length, padding='post')
+        predicted_probs = model.predict(sequence)[0]
+        predicted_probs = np.asarray(predicted_probs).astype('float64')
+        predicted_probs = np.log(predicted_probs + 1e-10) / temperature
+        predicted_probs = np.exp(predicted_probs) / np.sum(np.exp(predicted_probs))
+        predicted_index = np.random.choice(len(predicted_probs), p=predicted_probs)
+        next_word = tokenizer.index_word.get(predicted_index, '')
+        if not next_word:
+            break
+        sentence.append(next_word)
+    return ' '.join(sentence)
+# === Veri İşleme ve Model Eğitim ===
+file_path = input("Veri setinin dosya yolunu giriniz: ")
+try:
+    with open(file_path, "r", encoding="utf-8") as f:
+        dataset = f.readlines()
+except FileNotFoundError:
+    print("Dosya bulunamadı!")
+    exit()
+tokenized_sentences = [re.findall(r'\b\w+\b', sentence.lower()) for sentence in dataset]
+word2vec_model = Word2Vec(tokenized_sentences, vector_size=vector_size, window=window_size, min_count=min_count, workers=max_worker)
+tokenizer = Tokenizer()
+tokenizer.fit_on_texts([' '.join(sentence) for sentence in tokenized_sentences])
+sequences = tokenizer.texts_to_sequences([' '.join(sentence) for sentence in tokenized_sentences])
+X = pad_sequences(sequences, maxlen=context_length, padding='post')
+y = np.array([seq[-1] if len(seq) > 0 else 0 for seq in sequences])
+model = train_model(X, y, tokenizer)
+# === Kullanıcıdan Girdi Al ve Cümle Üret ===
+start_word = input("Başlangıç kelimesi giriniz: ")
+print("\nÜretilen Cümle:", generate_sentence(model, tokenizer, start_word, sentence_length, temperature=1.0))