func main() { flag.Parse() if flag.NArg() != 1 && flag.NArg() != 2 { flag.Usage() os.Exit(1) } config := common.ReadConfigOrExit(flag.Arg(0)) transitionSystem, ok := common.TransitionSystems[config.Parser.System] if !ok { log.Fatalf("Unknown transition system: %s", config.Parser.System) } blasImpl, ok := blasImpls[*blas] if !ok { log.Fatalf("Unknown blas implementation: %s", *blas) } labelNumberer := common.ReadTransitionsOrExit(config.Parser.Transitions, transitionSystem) parseNetwork := common.ReadModelOrExit(config.Parser.Model, blasImpl) var morphNetwork *network.Network if len(config.Parser.MorphModel) != 0 { morphNetwork = common.ReadModelOrExit(config.Parser.MorphModel, blasImpl) } ilas := common.ReadIlasOrExit(config.Parser.Inputs) normalizer := common.ReadNormalizerOrExit(config.Parser.Normalisation) layerEmbeddings := common.MustReadAllEmbeddings(config.Embeddings) realizer := input.NewInputVectorRealizer(ilas, layerEmbeddings, normalizer) var guide system.Guide if morphNetwork != nil { log.Print("Using morphology") guide = network.NewMorphGuide(parseNetwork, morphNetwork, *labelNumberer, realizer) } else { guide = network.NewGuide(parseNetwork, *labelNumberer, realizer) } parser := system.NewGreedyParser(transitionSystem, guide) if *cpuprofile != "" { f, err := os.Create(*cpuprofile) if err != nil { log.Fatal(err) } pprof.StartCPUProfile(f) defer pprof.StopCPUProfile() } start := time.Now() run(parser) elapsed := time.Since(start) log.Printf("Parsing took %s", elapsed) }
func main() { flag.Parse() if flag.NArg() != 3 { flag.Usage() os.Exit(1) } config := common.ReadConfigOrExit(flag.Arg(0)) transitionSystem, ok := common.TransitionSystems[config.Parser.System] if !ok { log.Fatalf("Unknown transition system: %s", config.Parser.System) } oracleConstructor, ok := common.Oracles[config.Parser.System] if !ok { log.Fatalf("Unknown transition system: %s", config.Parser.System) } log.Printf("Transition system: %s", config.Parser.System) ilas := common.ReadIlasOrExit(config.Parser.Inputs) var labelNumberer *system.LabelNumberer if config.Parser.Transitions != "" { if _, err := os.Stat(config.Parser.Transitions); err == nil { log.Printf("Transitions filename %s exists, reusing...", config.Parser.Transitions) labelNumberer = common.ReadTransitionsOrExit(config.Parser.Transitions, transitionSystem) } } instanceWriter, err := os.Create(flag.Arg(2)) common.ExitIfError("Cannot open instance file for writing:", err) defer instanceWriter.Close() trainDataWriter := input.NewTrainDataWriter(instanceWriter) layerEmbeddings := common.MustReadAllEmbeddings(config.Embeddings) realizer := input.NewInputVectorRealizer(ilas, layerEmbeddings, nil) var collector *common.WritingCollector if labelNumberer == nil { collector = common.NewWritingCollector(realizer, trainDataWriter) } else { collector = common.NewWritingCollectorWithLabelNumberer(realizer, labelNumberer, trainDataWriter) } trainer := system.NewGreedyTrainer(transitionSystem, collector) f, err := os.Open(flag.Arg(1)) common.ExitIfError("Cannot open training data:", err) defer f.Close() log.Println("Creating training instances...") common.ProcessData(f, func(s []conllx.Token) error { goldDependencies, err := system.SentenceToDependencies(s) if err != nil { return fmt.Errorf("Cannot extract dependencies: %s", err.Error()) } trainer.Parse(s, oracleConstructor(goldDependencies)) return nil }) if err != nil { common.ExitIfError("Cannot process data:", err) } if config.Parser.Transitions != "" { if _, err := os.Stat(config.Parser.Transitions); err != nil { writeTransitions(transitionSystem, collector.LabelNumberer(), config.Parser.Transitions) } } }