Spaces:

saichandrapandraju
/

make_more_names

Runtime error

App Files Files Community

saichandrapandraju committed on Jun 27, 2023

Commit

e81673f

1 Parent(s): cc7c5b8

implement Embedding Based Single Layer LM

Browse files

Files changed (2) hide show

app.py +33 -2
mlp.pt +0 -0

app.py CHANGED Viewed

@@ -14,6 +14,11 @@ def init_count_model():
 def init_single_layer_model():
     """Load and return the contents of 'single_layer.pt' using torch.load."""
     return torch.load("single_layer.pt")
 @st.cache_resource
 def init_char_index_mappings():
     with open("ctoi.json") as ci, open("itoc.json") as ic:
@@ -21,6 +26,7 @@ def init_char_index_mappings():
 count_p = init_count_model()
 single_layer_w = init_single_layer_model()
 ctoi, itoc = init_char_index_mappings()
 def predict_with_count(starting_char:str, num_words):
@@ -64,10 +70,35 @@ def predict_with_single_layer_nn(starting_char:str, num_words):
         output.append(''.join(out[:-1]))
     return output
 def predict(query, num_words):
     try:
-        preds = [predict_with_count(query, num_words), predict_with_single_layer_nn(query, num_words)]
-        labels = ["Count Based Language Model", "Single Linear Layer Language Model"]
         results = {labels[idx]: preds[idx] for idx in range(len(preds))}
         st.write(pd.DataFrame(results, index=range(num_words)))
     except ValueError as e:

 def init_single_layer_model():
     """Load and return the contents of 'single_layer.pt' using torch.load."""
     return torch.load("single_layer.pt")
+@st.cache_resource
+def init_mlp():
+    """Load the MLP language-model parameters stored in 'mlp.pt'.
+
+    Returns:
+        A 5-tuple ``(emb, w1, b1, w2, b2)`` taken from the loaded mapping
+        under the keys "emb", "w1", "b1", "w2" and "b2", in that order.
+    """
+    # NOTE(review): torch.load unpickles the file by default, so mlp.pt must
+    # come from a trusted source -- confirm it is only ever the bundled file.
+    mlp_layers = torch.load("mlp.pt")
+    return mlp_layers["emb"], mlp_layers['w1'], mlp_layers['b1'], mlp_layers['w2'], mlp_layers['b2']
 @st.cache_resource
 def init_char_index_mappings():
     with open("ctoi.json") as ci, open("itoc.json") as ic:
 count_p = init_count_model()
 single_layer_w = init_single_layer_model()
+mlp_emb, mlp_w1, mlp_b1, mlp_w2, mlp_b2 = init_mlp()
 ctoi, itoc = init_char_index_mappings()
 def predict_with_count(starting_char:str, num_words):
         output.append(''.join(out[:-1]))
     return output
+def predict_with_mlp(starting_char:str, num_words):
+    """Sample ``num_words`` strings from the MLP model, each starting with ``starting_char``.
+
+    Every string is generated one character at a time: the current context
+    of character indices is embedded, passed through a tanh hidden layer and
+    an output layer, and the next index is sampled from the softmax
+    distribution. Generation of a string stops when index 0 is sampled.
+
+    Args:
+        starting_char: First character of every generated string; must be a
+            key of ``ctoi``.
+        num_words: Number of strings to generate.
+
+    Returns:
+        A list with one generated string per requested word.
+
+    Raises:
+        ValueError: If ``starting_char`` is not a key of ``ctoi`` (only
+            checked inside the loop, i.e. when ``num_words`` is at least 1).
+    """
+    # One generator per call, seeded with the module-level SEED: repeated
+    # calls replay the same sequence of random draws.
+    g = torch.Generator().manual_seed(SEED)
+    output = []
+    context_length = 3
+    for _ in range(num_words):
+        out = []
+        # Left-pad the context with index 0 so that, together with the
+        # starting character, it holds context_length entries.
+        context = [0]*(context_length-1)
+        # NOTE(review): this check does not depend on the loop variable; it
+        # could be done once before the loop -- confirm before moving it.
+        if starting_char not in ctoi:
+            raise ValueError("Starting Character is not a valid alphabet. Please input a valid alphabet.")
+        ix = ctoi[starting_char]
+        out.append(starting_char)
+        context+=[ix]
+        while True:
+            # Look up the embedding of every index in the context
+            # (presumably shape (1, context_length, emb_dim) -- TODO confirm).
+            emb = mlp_emb[torch.tensor([context])]
+            h = torch.tanh(emb.view(1,-1) @ mlp_w1 + mlp_b1)        # flatten the embeddings into a single row (batch size 1)
+            logits = h @ mlp_w2 + mlp_b2
+            probs = F.softmax(logits, dim=1)
+            # Draw the next character index from the predicted distribution.
+            ix = torch.multinomial(probs, num_samples=1, generator=g).item()
+            # Slide the context window: drop the oldest index, append the new one.
+            context = context[1:] + [ix]
+            # itoc is keyed by the string form of the index.
+            out.append(itoc[str(ix)])
+            # Index 0 ends the current string (presumably the word-boundary
+            # token, as it is also used for padding above).
+            if ix == 0:
+                break
+        # Drop the last appended character, i.e. the one for the terminating index 0.
+        output.append(''.join(out[:-1]))
+    return output
 def predict(query, num_words):
     try:
+        preds = [predict_with_count(query, num_words), predict_with_single_layer_nn(query, num_words), predict_with_mlp(query, num_words)]
+        labels = ["Count Based LM", "Single Linear Layer LM", "Embedding Based Single Hidden Layer LM"]
         results = {labels[idx]: preds[idx] for idx in range(len(preds))}
         st.write(pd.DataFrame(results, index=range(num_words)))
     except ValueError as e:

mlp.pt ADDED Viewed

Binary file (49.3 kB). View file