Improve gpt2 demo script

Bycob · Bycob · commit 881249ce440e · 2019-09-26T18:02:34.000+02:00
diff --git a/demo/gpt2/run_gpt2.py b/demo/gpt2/run_gpt2.py
@@ -1,3 +1,4 @@
+import random
 import sys
 import argparse
 from dd_client import DD
@@ -6,8 +7,10 @@
 parser.add_argument("-r", "--repository", required=True, help="Model repository")
 parser.add_argument("--host", type=str, default="localhost")
 parser.add_argument("--port", type=int, default=8080)
-parser.add_argument("--cpu", action='store_true')
+parser.add_argument("--cpu", action='store_true', help="Force model to run on CPU")
 parser.add_argument("--input-size", type=int, default=512)
+parser.add_argument("--topk", type=int, default=5, help="How many top predictions should be considered to choose the next token.")
+parser.add_argument("--temperature", type=float, default=1, help="Temperature of the predictions. The higher, the 'randomer'.")
 
 args = parser.parse_args()
 
@@ -41,9 +44,32 @@
     data = [prompt]
     parameters_input = {'word_start': "Ġ", 'suffix_start': ""}
     parameters_mllib = {}
-    parameters_output = {'best':3}
+    parameters_output = {'best':args.topk}
     result = dd.post_predict(sname, data, parameters_input,parameters_mllib,parameters_output)
-    word = result['body']['predictions'][0]['classes'][0]['cat'].replace("Ġ", " ").replace("Ċ", "\n")
-    print(word, sep='', end='')
+
+    # Select result from the returned tokens
+    word_probs = list()
+    total_probs = 0
+
+    for cls in result['body']['predictions'][0]['classes']:
+        word = cls['cat'].replace("Ġ", " ")
+        # dede does not handle newline characters well, so tokens containing a newline ('Ċ') are skipped
+        if 'Ċ' in word:
+            continue
+
+        prob = pow(cls['prob'], args.temperature)
+        total_probs += prob
+        word_probs.append((word, prob))
+    
+    selector = random.uniform(0, total_probs)
+    total_probs = 0
+
+    for word, prob in word_probs:
+        total_probs += prob
+        if total_probs > selector:
+            selected_word = word
+            break
+
+    print(selected_word, sep='', end='')
     sys.stdout.flush()
-    prompt += word
+    prompt += selected_word