google · ringgaard · Jan 11, 2020 · Jan 8, 2020 · Jan 10, 2020 · anders-sandholm
diff --git a/doc/guide/caspar.md b/doc/guide/caspar.md
@@ -57,11 +57,23 @@ import sling
 import sling.flags as flags
 import sling.task.workflow as workflow
 
-# Start up workflow system.
+flags.define("--accurate", default=False,action='store_true')
+
 flags.parse()
+
+if flags.arg.accurate:
+  modelfn = "local/data/e/caspar/caspar-accurate.flow"
+  rnn_layers = 3
+  rnn_dim = 192
+else:
+  modelfn = "local/data/e/caspar/caspar.flow"
+  rnn_layers = 1
+  rnn_dim = 128
+
+# Start up workflow system.
 workflow.startup()
 
-# Create worflow.
+# Create workflow.
 wf = workflow.Workflow("parser-training")
 
 # Parser trainer inputs and outputs.
@@ -80,23 +92,28 @@ word_embeddings = wf.resource(
   format="embeddings"
 )
 
-parser_model = wf.resource(
-  "local/data/e/caspar/caspar.flow",
-  format="flow"
-)
+parser_model = wf.resource(modelfn, format="flow")
 
 # Parser trainer task.
 trainer = wf.task("caspar-trainer")
 
 trainer.add_params({
+  "rnn_type": 1,
+  "rnn_dim": rnn_dim,
+  "rnn_highways": True,
+  "rnn_layers": rnn_layers,
+  "dropout": 0.2,
+  "ff_l2reg": 0.0001,
+
   "learning_rate": 1.0,
   "learning_rate_decay": 0.8,
   "clipping": 1,
   "optimizer": "sgd",
-  "epochs": 50000,
   "batch_size": 32,
   "rampup": 120,
-  "report_interval": 500
+  "report_interval": 1000,
+  "learning_rate_cliff": 40000,
+  "epochs": 50000,
 })
 
 trainer.attach_input("training_corpus", training_corpus)
@@ -111,9 +128,10 @@ workflow.run(wf)
 workflow.shutdown()
 ```
 
-This model takes ~90 minutes to train. It will output evaluation metrics
-each 500 epochs, and when it is done, the final parser model will be written
-to `local/data/e/caspar/caspar.flow`.
+This model takes ~30 minutes to train. It will output evaluation metrics
+each 1000 epochs, and when it is done, the final parser model will be written
+to `local/data/e/caspar/caspar.flow`. You can train a slightly more accurate,
+but much slower parser by using the `--accurate` flag.
 
 If you don't have access to OntoNotes 5, you can download a pre-trained model
 from [here](http://www.jbox.dk/sling/caspar.flow).
@@ -203,59 +221,73 @@ This tool takes the following commandline arguments:
    [... I sling/nlp/parser/tools/parse.cc:131] Load parser from local/data/e/caspar/caspar.flow
    [... I sling/nlp/parser/tools/parse.cc:140] 34.7368 ms loading parser
    [... I sling/nlp/parser/tools/parse.cc:235] Evaluating parser on local/data/corpora/caspar/dev.rec
-   SPAN_P+=76898
-   SPAN_P-=6800
-   SPAN_R+=76898
-   SPAN_R-=6192
-   SPAN_Precision=91.8755
-   SPAN_Recall=92.5478
-   SPAN_F1=92.2105
-   FRAME_P+=77866
-   FRAME_P-=5859
-   FRAME_R+=77859
-   FRAME_R-=5233
-   FRAME_Precision=93.0021
-   FRAME_Recall=93.7022
-   FRAME_F1=93.3508
-   TYPE_P+=74277
-   TYPE_P-=9448
-   TYPE_R+=74275
-   TYPE_R-=8817
-   TYPE_Precision=88.7154
-   TYPE_Recall=89.3889
-   TYPE_F1=89.0509
-   ROLE_P+=37762
-   ROLE_P-=16848
-   ROLE_R+=37755
-   ROLE_R-=16397
-   ROLE_Precision=69.1485
-   ROLE_Recall=69.7204
-   ROLE_F1=69.4333
+   SPAN_P+=77757
+   SPAN_P-=6185
+   SPAN_R+=77757
+   SPAN_R-=5333
+   SPAN_Precision=92.6318
+   SPAN_Recall=93.5817
+   SPAN_F1=93.1043
+   FRAME_P+=78724
+   FRAME_P-=5225
+   FRAME_R+=78715
+   FRAME_R-=4377
+   FRAME_Precision=93.776
+   FRAME_Recall=94.7323
+   FRAME_F1=94.2517
+   PAIR_P+=52597
+   PAIR_P-=2339
+   PAIR_R+=51988
+   PAIR_R-=2164
+   PAIR_Precision=95.7423
+   PAIR_Recall=96.0038
+   PAIR_F1=95.8729
+   EDGE_P+=44432
+   EDGE_P-=10504
+   EDGE_R+=44400
+   EDGE_R-=9752
+   EDGE_Precision=80.8796
+   EDGE_Recall=81.9914
+   EDGE_F1=81.4317
+   ROLE_P+=39836
+   ROLE_P-=15100
+   ROLE_R+=39826
+   ROLE_R-=14326
+   ROLE_Precision=72.5135
+   ROLE_Recall=73.5448
+   ROLE_F1=73.0255
+   TYPE_P+=75604
+   TYPE_P-=8345
+   TYPE_R+=75595
+   TYPE_R-=7497
+   TYPE_Precision=90.0594
+   TYPE_Recall=90.9775
+   TYPE_F1=90.5161
    LABEL_P+=0
    LABEL_P-=0
    LABEL_R+=0
    LABEL_R-=0
    LABEL_Precision=0
    LABEL_Recall=0
    LABEL_F1=0
-   SLOT_P+=112039
-   SLOT_P-=26296
-   SLOT_R+=112030
-   SLOT_R-=25214
-   SLOT_Precision=80.9911
-   SLOT_Recall=81.6283
-   SLOT_F1=81.3085
-   COMBINED_P+=266803
-   COMBINED_P-=38955
-   COMBINED_R+=266787
-   COMBINED_R-=36639
-   COMBINED_Precision=87.2595
-   COMBINED_Recall=87.9249
-   COMBINED_F1=87.591
+   SLOT_P+=115440
+   SLOT_P-=23445
+   SLOT_R+=115421
+   SLOT_R-=21823
+   SLOT_Precision=83.1191
+   SLOT_Recall=84.0991
+   SLOT_F1=83.6063
+   COMBINED_P+=271921
+   COMBINED_P-=34855
+   COMBINED_R+=271893
+   COMBINED_R-=31533
+   COMBINED_Precision=88.6383
+   COMBINED_Recall=89.6077
+   COMBINED_F1=89.1203
    #GOLDEN_SPANS=83090
-   #PREDICTED_SPANS=83698
+   #PREDICTED_SPANS=83942
    #GOLDEN_FRAMES=83092
-   #PREDICTED_FRAMES=83725
+   #PREDICTED_FRAMES=83949
    ```
 
 ## Using the CASPAR parser in Python

diff --git a/doc/guide/myelin.md b/doc/guide/myelin.md
@@ -380,6 +380,7 @@ var = <#flags> (IN=1, OUT=2, REF=4, LEARNABLE=8 UNIQUE=16, from version 5)
       <#aliases> <alias$>*
       <dtype$>
       <shape>
+      <#attrs> attr* (from version 6)
       <#bytes> value
 
 op = <#flags> (unused, from version 5)
@@ -411,7 +412,7 @@ dtype = "float16" | "float32" | "float64" | "int8" | "uint8" |
         "int16" | "uint16" | "int32" | "uint64"
 
 "flow" = 0x776f6c66
-version = 3 | 4 | 5
+version = 3 | 4 | 5 | 6
 ```
 
 A flow file begins with the _magic_ string "flow" followed by a version number.

diff --git a/python/myelin/builder.py b/python/myelin/builder.py
@@ -226,7 +226,7 @@ def varname(self, var):
       index += 1
 
   def concat(self, args, name=None):
-    op = self.rawop("ConcatV2", name)
+    op = self.rawop("Concat", name)
     shape = [args[0].shape[0], 0]
     for arg in args:
       op.add_input(arg)

diff --git a/python/myelin/flow.py b/python/myelin/flow.py
@@ -155,6 +155,7 @@ def __init__(self, name):
     self.aliases = []
     self.type = None
     self.shape = []
+    self.attrs = {}
     self.data = None
     self.producer = None
     self.consumers = []
@@ -214,6 +215,15 @@ def unique(self, value):
     else:
       self.flags &= ~16
 
+  def add_attr(self, name, value):
+    if type(value) is bool:
+      if value == True: value = 1
+      elif value == False: value = 0
+    self.attrs[name] = str(value)
+
+  def attr(self, name):
+    return self.attrs.get(name, None)
+
   def shape_defined(self):
     for d in self.shape:
       if d == -1: return False
@@ -560,7 +570,7 @@ def save(self, filename):
     # Write flow file header
     f = FileWriter(filename)
     f.write('flow')
-    f.write_int(5)
+    f.write_int(6)
     f.write_int(self.flags)
 
     # Write variables.
@@ -574,6 +584,10 @@ def save(self, filename):
       f.write_string(var.type)
       f.write_int(len(var.shape))
       for d in var.shape: f.write_int(d)
+      f.write_int(len(var.attrs))
+      for a in var.attrs:
+        f.write_string(a)
+        f.write_string(op.attrs[a])
       f.write_object(var.data)
 
     # Write operations.
@@ -636,7 +650,7 @@ def load(self, filename):
     assert magic == memoryview(b'flow'), magic.tobytes()
 
     version = f.read_int()
-    assert version == 4 or version == 5, version
+    assert version == 4 or version == 5 or version == 6, version
     if version >= 5: self.flags = f.read_int()
 
     num_vars = f.read_int()
@@ -658,6 +672,12 @@ def load(self, filename):
         shape.append(f.read_int())
       var = self.var(name, type=t, shape=shape)
       var.flags = flags
+      if version >= 6:
+        num_attr = f.read_int()
+        for _ in range(num_attr):
+          attr_name = f.read_string()
+          attr_val = f.read_string()
+          var.add_attr(attr_name, attr_val)
       size = f.read_long()
       if size > 0:
         var.data = f.slice(size)  # avoid creating a copy

diff --git a/python/myelin/simulator.py b/python/myelin/simulator.py
@@ -218,7 +218,7 @@ def compute(flow, f, data):
       v[o[0]] = np.array(len(v[i[0]].shape))
     elif op.type == "Identity":
       v[o[0]] = v[i[0]]
-    elif op.type == "ConcatV2":
+    elif op.type == "Concat":
       n = int(op.attr("N"))
       axis = v[i[n]]
       seq = []

diff --git a/sling/base/registry.h b/sling/base/registry.h
@@ -192,7 +192,7 @@ template <class T> struct ComponentRegistry {
     Registrar *r = components;
     while (r != nullptr && strcmp(type, r->type()) != 0) r = r->next();
     if (r == nullptr) {
-      LOG(FATAL) << "Unknown " << name << " component: '" << type << "'.";
+      LOG(FATAL) << "Unknown " << name << " component: " << type;
     }
     return r;
   }

diff --git a/sling/file/posix.cc b/sling/file/posix.cc
@@ -271,7 +271,7 @@ class PosixFileSystem : public FileSystem {
     return Status::OK;
   }
 
-  Status FlushMappedMemory(void *data, size_t size) {
+  Status FlushMappedMemory(void *data, size_t size) override {
     if (msync(data, size, MS_SYNC) != 0) return IOError("msync", errno);
     return Status::OK;
   }